1 //===-- MachODump.cpp - Object file dumping utility for llvm --------------===//
3 // The LLVM Compiler Infrastructure
5 // This file is distributed under the University of Illinois Open Source
6 // License. See LICENSE.TXT for details.
8 //===----------------------------------------------------------------------===//
10 // This file implements the MachO-specific dumper for llvm-objdump.
12 //===----------------------------------------------------------------------===//
14 #include "llvm/Object/MachO.h"
15 #include "llvm-objdump.h"
16 #include "llvm-c/Disassembler.h"
17 #include "llvm/ADT/STLExtras.h"
18 #include "llvm/ADT/StringExtras.h"
19 #include "llvm/ADT/Triple.h"
20 #include "llvm/Config/config.h"
21 #include "llvm/DebugInfo/DIContext.h"
22 #include "llvm/DebugInfo/DWARF/DWARFContext.h"
23 #include "llvm/Demangle/Demangle.h"
24 #include "llvm/MC/MCAsmInfo.h"
25 #include "llvm/MC/MCContext.h"
26 #include "llvm/MC/MCDisassembler/MCDisassembler.h"
27 #include "llvm/MC/MCInst.h"
28 #include "llvm/MC/MCInstPrinter.h"
29 #include "llvm/MC/MCInstrDesc.h"
30 #include "llvm/MC/MCInstrInfo.h"
31 #include "llvm/MC/MCRegisterInfo.h"
32 #include "llvm/MC/MCSubtargetInfo.h"
33 #include "llvm/Object/MachOUniversal.h"
34 #include "llvm/Support/Casting.h"
35 #include "llvm/Support/CommandLine.h"
36 #include "llvm/Support/Debug.h"
37 #include "llvm/Support/Endian.h"
38 #include "llvm/Support/Format.h"
39 #include "llvm/Support/FormattedStream.h"
40 #include "llvm/Support/GraphWriter.h"
41 #include "llvm/Support/LEB128.h"
42 #include "llvm/Support/MachO.h"
43 #include "llvm/Support/MemoryBuffer.h"
44 #include "llvm/Support/TargetRegistry.h"
45 #include "llvm/Support/TargetSelect.h"
46 #include "llvm/Support/ToolOutputFile.h"
47 #include "llvm/Support/raw_ostream.h"
50 #include <system_error>
59 using namespace object;
63 cl::desc("Print line information from debug info if available"));
65 static cl::opt<std::string> DSYMFile("dsym",
66 cl::desc("Use .dSYM file for debug info"));
68 static cl::opt<bool> FullLeadingAddr("full-leading-addr",
69 cl::desc("Print full leading address"));
71 static cl::opt<bool> NoLeadingAddr("no-leading-addr",
72 cl::desc("Print no leading address"));
74 static cl::opt<bool> NoLeadingHeaders("no-leading-headers",
75 cl::desc("Print no leading headers"));
77 cl::opt<bool> llvm::UniversalHeaders("universal-headers",
78 cl::desc("Print Mach-O universal headers "
79 "(requires -macho)"));
82 llvm::ArchiveHeaders("archive-headers",
83 cl::desc("Print archive headers for Mach-O archives "
84 "(requires -macho)"));
87 ArchiveMemberOffsets("archive-member-offsets",
88 cl::desc("Print the offset to each archive member for "
89 "Mach-O archives (requires -macho and "
90 "-archive-headers)"));
93 llvm::IndirectSymbols("indirect-symbols",
94 cl::desc("Print indirect symbol table for Mach-O "
95 "objects (requires -macho)"));
98 llvm::DataInCode("data-in-code",
99 cl::desc("Print the data in code table for Mach-O objects "
100 "(requires -macho)"));
103 llvm::LinkOptHints("link-opt-hints",
104 cl::desc("Print the linker optimization hints for "
105 "Mach-O objects (requires -macho)"));
108 llvm::InfoPlist("info-plist",
109 cl::desc("Print the info plist section as strings for "
110 "Mach-O objects (requires -macho)"));
113 llvm::DylibsUsed("dylibs-used",
114 cl::desc("Print the shared libraries used for linked "
115 "Mach-O files (requires -macho)"));
118 llvm::DylibId("dylib-id",
119 cl::desc("Print the shared library's id for the dylib Mach-O "
120 "file (requires -macho)"));
123 llvm::NonVerbose("non-verbose",
124 cl::desc("Print the info for Mach-O objects in "
125 "non-verbose or numeric form (requires -macho)"));
128 llvm::ObjcMetaData("objc-meta-data",
129 cl::desc("Print the Objective-C runtime meta data for "
130 "Mach-O files (requires -macho)"));
132 cl::opt<std::string> llvm::DisSymName(
134 cl::desc("disassemble just this symbol's instructions (requires -macho)"));
136 static cl::opt<bool> NoSymbolicOperands(
137 "no-symbolic-operands",
138 cl::desc("do not symbolic operands when disassembling (requires -macho)"));
140 static cl::list<std::string>
141 ArchFlags("arch", cl::desc("architecture(s) from a Mach-O file to dump"),
144 bool ArchAll = false;
146 static std::string ThumbTripleName;
148 static const Target *GetTarget(const MachOObjectFile *MachOObj,
149 const char **McpuDefault,
150 const Target **ThumbTarget) {
151 // Figure out the target triple.
152 llvm::Triple TT(TripleName);
153 if (TripleName.empty()) {
154 TT = MachOObj->getArchTriple(McpuDefault);
155 TripleName = TT.str();
158 if (TT.getArch() == Triple::arm) {
159 // We've inferred a 32-bit ARM target from the object file. All MachO CPUs
160 // that support ARM are also capable of Thumb mode.
161 llvm::Triple ThumbTriple = TT;
162 std::string ThumbName = (Twine("thumb") + TT.getArchName().substr(3)).str();
163 ThumbTriple.setArchName(ThumbName);
164 ThumbTripleName = ThumbTriple.str();
167 // Get the target specific parser.
169 const Target *TheTarget = TargetRegistry::lookupTarget(TripleName, Error);
170 if (TheTarget && ThumbTripleName.empty())
173 *ThumbTarget = TargetRegistry::lookupTarget(ThumbTripleName, Error);
177 errs() << "llvm-objdump: error: unable to get target for '";
179 errs() << TripleName;
181 errs() << ThumbTripleName;
182 errs() << "', see --version and --triple.\n";
186 struct SymbolSorter {
187 bool operator()(const SymbolRef &A, const SymbolRef &B) {
188 Expected<SymbolRef::Type> ATypeOrErr = A.getType();
190 report_error(A.getObject()->getFileName(), ATypeOrErr.takeError());
191 SymbolRef::Type AType = *ATypeOrErr;
192 Expected<SymbolRef::Type> BTypeOrErr = B.getType();
194 report_error(B.getObject()->getFileName(), BTypeOrErr.takeError());
195 SymbolRef::Type BType = *BTypeOrErr;
196 uint64_t AAddr = (AType != SymbolRef::ST_Function) ? 0 : A.getValue();
197 uint64_t BAddr = (BType != SymbolRef::ST_Function) ? 0 : B.getValue();
198 return AAddr < BAddr;
202 // Types for the storted data in code table that is built before disassembly
203 // and the predicate function to sort them.
204 typedef std::pair<uint64_t, DiceRef> DiceTableEntry;
205 typedef std::vector<DiceTableEntry> DiceTable;
206 typedef DiceTable::iterator dice_table_iterator;
208 // This is used to search for a data in code table entry for the PC being
209 // disassembled. The j parameter has the PC in j.first. A single data in code
210 // table entry can cover many bytes for each of its Kind's. So if the offset,
211 // aka the i.first value, of the data in code table entry plus its Length
212 // covers the PC being searched for this will return true. If not it will
214 static bool compareDiceTableEntries(const DiceTableEntry &i,
215 const DiceTableEntry &j) {
217 i.second.getLength(Length);
219 return j.first >= i.first && j.first < i.first + Length;
222 static uint64_t DumpDataInCode(const uint8_t *bytes, uint64_t Length,
223 unsigned short Kind) {
224 uint32_t Value, Size = 1;
228 case MachO::DICE_KIND_DATA:
231 dumpBytes(makeArrayRef(bytes, 4), outs());
232 Value = bytes[3] << 24 | bytes[2] << 16 | bytes[1] << 8 | bytes[0];
233 outs() << "\t.long " << Value;
235 } else if (Length >= 2) {
237 dumpBytes(makeArrayRef(bytes, 2), outs());
238 Value = bytes[1] << 8 | bytes[0];
239 outs() << "\t.short " << Value;
243 dumpBytes(makeArrayRef(bytes, 2), outs());
245 outs() << "\t.byte " << Value;
248 if (Kind == MachO::DICE_KIND_DATA)
249 outs() << "\t@ KIND_DATA\n";
251 outs() << "\t@ data in code kind = " << Kind << "\n";
253 case MachO::DICE_KIND_JUMP_TABLE8:
255 dumpBytes(makeArrayRef(bytes, 1), outs());
257 outs() << "\t.byte " << format("%3u", Value) << "\t@ KIND_JUMP_TABLE8\n";
260 case MachO::DICE_KIND_JUMP_TABLE16:
262 dumpBytes(makeArrayRef(bytes, 2), outs());
263 Value = bytes[1] << 8 | bytes[0];
264 outs() << "\t.short " << format("%5u", Value & 0xffff)
265 << "\t@ KIND_JUMP_TABLE16\n";
268 case MachO::DICE_KIND_JUMP_TABLE32:
269 case MachO::DICE_KIND_ABS_JUMP_TABLE32:
271 dumpBytes(makeArrayRef(bytes, 4), outs());
272 Value = bytes[3] << 24 | bytes[2] << 16 | bytes[1] << 8 | bytes[0];
273 outs() << "\t.long " << Value;
274 if (Kind == MachO::DICE_KIND_JUMP_TABLE32)
275 outs() << "\t@ KIND_JUMP_TABLE32\n";
277 outs() << "\t@ KIND_ABS_JUMP_TABLE32\n";
284 static void getSectionsAndSymbols(MachOObjectFile *MachOObj,
285 std::vector<SectionRef> &Sections,
286 std::vector<SymbolRef> &Symbols,
287 SmallVectorImpl<uint64_t> &FoundFns,
288 uint64_t &BaseSegmentAddress) {
289 for (const SymbolRef &Symbol : MachOObj->symbols()) {
290 Expected<StringRef> SymName = Symbol.getName();
292 report_error(MachOObj->getFileName(), SymName.takeError());
293 if (!SymName->startswith("ltmp"))
294 Symbols.push_back(Symbol);
297 for (const SectionRef &Section : MachOObj->sections()) {
299 Section.getName(SectName);
300 Sections.push_back(Section);
303 bool BaseSegmentAddressSet = false;
304 for (const auto &Command : MachOObj->load_commands()) {
305 if (Command.C.cmd == MachO::LC_FUNCTION_STARTS) {
306 // We found a function starts segment, parse the addresses for later
308 MachO::linkedit_data_command LLC =
309 MachOObj->getLinkeditDataLoadCommand(Command);
311 MachOObj->ReadULEB128s(LLC.dataoff, FoundFns);
312 } else if (Command.C.cmd == MachO::LC_SEGMENT) {
313 MachO::segment_command SLC = MachOObj->getSegmentLoadCommand(Command);
314 StringRef SegName = SLC.segname;
315 if (!BaseSegmentAddressSet && SegName != "__PAGEZERO") {
316 BaseSegmentAddressSet = true;
317 BaseSegmentAddress = SLC.vmaddr;
323 static void PrintIndirectSymbolTable(MachOObjectFile *O, bool verbose,
324 uint32_t n, uint32_t count,
325 uint32_t stride, uint64_t addr) {
326 MachO::dysymtab_command Dysymtab = O->getDysymtabLoadCommand();
327 uint32_t nindirectsyms = Dysymtab.nindirectsyms;
328 if (n > nindirectsyms)
329 outs() << " (entries start past the end of the indirect symbol "
330 "table) (reserved1 field greater than the table size)";
331 else if (n + count > nindirectsyms)
332 outs() << " (entries extends past the end of the indirect symbol "
335 uint32_t cputype = O->getHeader().cputype;
336 if (cputype & MachO::CPU_ARCH_ABI64)
337 outs() << "address index";
339 outs() << "address index";
344 for (uint32_t j = 0; j < count && n + j < nindirectsyms; j++) {
345 if (cputype & MachO::CPU_ARCH_ABI64)
346 outs() << format("0x%016" PRIx64, addr + j * stride) << " ";
348 outs() << format("0x%08" PRIx32, (uint32_t)addr + j * stride) << " ";
349 MachO::dysymtab_command Dysymtab = O->getDysymtabLoadCommand();
350 uint32_t indirect_symbol = O->getIndirectSymbolTableEntry(Dysymtab, n + j);
351 if (indirect_symbol == MachO::INDIRECT_SYMBOL_LOCAL) {
355 if (indirect_symbol ==
356 (MachO::INDIRECT_SYMBOL_LOCAL | MachO::INDIRECT_SYMBOL_ABS)) {
357 outs() << "LOCAL ABSOLUTE\n";
360 if (indirect_symbol == MachO::INDIRECT_SYMBOL_ABS) {
361 outs() << "ABSOLUTE\n";
364 outs() << format("%5u ", indirect_symbol);
366 MachO::symtab_command Symtab = O->getSymtabLoadCommand();
367 if (indirect_symbol < Symtab.nsyms) {
368 symbol_iterator Sym = O->getSymbolByIndex(indirect_symbol);
369 SymbolRef Symbol = *Sym;
370 Expected<StringRef> SymName = Symbol.getName();
372 report_error(O->getFileName(), SymName.takeError());
382 static void PrintIndirectSymbols(MachOObjectFile *O, bool verbose) {
383 for (const auto &Load : O->load_commands()) {
384 if (Load.C.cmd == MachO::LC_SEGMENT_64) {
385 MachO::segment_command_64 Seg = O->getSegment64LoadCommand(Load);
386 for (unsigned J = 0; J < Seg.nsects; ++J) {
387 MachO::section_64 Sec = O->getSection64(Load, J);
388 uint32_t section_type = Sec.flags & MachO::SECTION_TYPE;
389 if (section_type == MachO::S_NON_LAZY_SYMBOL_POINTERS ||
390 section_type == MachO::S_LAZY_SYMBOL_POINTERS ||
391 section_type == MachO::S_LAZY_DYLIB_SYMBOL_POINTERS ||
392 section_type == MachO::S_THREAD_LOCAL_VARIABLE_POINTERS ||
393 section_type == MachO::S_SYMBOL_STUBS) {
395 if (section_type == MachO::S_SYMBOL_STUBS)
396 stride = Sec.reserved2;
400 outs() << "Can't print indirect symbols for (" << Sec.segname << ","
401 << Sec.sectname << ") "
402 << "(size of stubs in reserved2 field is zero)\n";
405 uint32_t count = Sec.size / stride;
406 outs() << "Indirect symbols for (" << Sec.segname << ","
407 << Sec.sectname << ") " << count << " entries";
408 uint32_t n = Sec.reserved1;
409 PrintIndirectSymbolTable(O, verbose, n, count, stride, Sec.addr);
412 } else if (Load.C.cmd == MachO::LC_SEGMENT) {
413 MachO::segment_command Seg = O->getSegmentLoadCommand(Load);
414 for (unsigned J = 0; J < Seg.nsects; ++J) {
415 MachO::section Sec = O->getSection(Load, J);
416 uint32_t section_type = Sec.flags & MachO::SECTION_TYPE;
417 if (section_type == MachO::S_NON_LAZY_SYMBOL_POINTERS ||
418 section_type == MachO::S_LAZY_SYMBOL_POINTERS ||
419 section_type == MachO::S_LAZY_DYLIB_SYMBOL_POINTERS ||
420 section_type == MachO::S_THREAD_LOCAL_VARIABLE_POINTERS ||
421 section_type == MachO::S_SYMBOL_STUBS) {
423 if (section_type == MachO::S_SYMBOL_STUBS)
424 stride = Sec.reserved2;
428 outs() << "Can't print indirect symbols for (" << Sec.segname << ","
429 << Sec.sectname << ") "
430 << "(size of stubs in reserved2 field is zero)\n";
433 uint32_t count = Sec.size / stride;
434 outs() << "Indirect symbols for (" << Sec.segname << ","
435 << Sec.sectname << ") " << count << " entries";
436 uint32_t n = Sec.reserved1;
437 PrintIndirectSymbolTable(O, verbose, n, count, stride, Sec.addr);
444 static void PrintDataInCodeTable(MachOObjectFile *O, bool verbose) {
445 MachO::linkedit_data_command DIC = O->getDataInCodeLoadCommand();
446 uint32_t nentries = DIC.datasize / sizeof(struct MachO::data_in_code_entry);
447 outs() << "Data in code table (" << nentries << " entries)\n";
448 outs() << "offset length kind\n";
449 for (dice_iterator DI = O->begin_dices(), DE = O->end_dices(); DI != DE;
452 DI->getOffset(Offset);
453 outs() << format("0x%08" PRIx32, Offset) << " ";
455 DI->getLength(Length);
456 outs() << format("%6u", Length) << " ";
461 case MachO::DICE_KIND_DATA:
464 case MachO::DICE_KIND_JUMP_TABLE8:
465 outs() << "JUMP_TABLE8";
467 case MachO::DICE_KIND_JUMP_TABLE16:
468 outs() << "JUMP_TABLE16";
470 case MachO::DICE_KIND_JUMP_TABLE32:
471 outs() << "JUMP_TABLE32";
473 case MachO::DICE_KIND_ABS_JUMP_TABLE32:
474 outs() << "ABS_JUMP_TABLE32";
477 outs() << format("0x%04" PRIx32, Kind);
481 outs() << format("0x%04" PRIx32, Kind);
486 static void PrintLinkOptHints(MachOObjectFile *O) {
487 MachO::linkedit_data_command LohLC = O->getLinkOptHintsLoadCommand();
488 const char *loh = O->getData().substr(LohLC.dataoff, 1).data();
489 uint32_t nloh = LohLC.datasize;
490 outs() << "Linker optimiztion hints (" << nloh << " total bytes)\n";
491 for (uint32_t i = 0; i < nloh;) {
493 uint64_t identifier = decodeULEB128((const uint8_t *)(loh + i), &n);
495 outs() << " identifier " << identifier << " ";
498 switch (identifier) {
500 outs() << "AdrpAdrp\n";
503 outs() << "AdrpLdr\n";
506 outs() << "AdrpAddLdr\n";
509 outs() << "AdrpLdrGotLdr\n";
512 outs() << "AdrpAddStr\n";
515 outs() << "AdrpLdrGotStr\n";
518 outs() << "AdrpAdd\n";
521 outs() << "AdrpLdrGot\n";
524 outs() << "Unknown identifier value\n";
527 uint64_t narguments = decodeULEB128((const uint8_t *)(loh + i), &n);
529 outs() << " narguments " << narguments << "\n";
533 for (uint32_t j = 0; j < narguments; j++) {
534 uint64_t value = decodeULEB128((const uint8_t *)(loh + i), &n);
536 outs() << "\tvalue " << format("0x%" PRIx64, value) << "\n";
543 static void PrintDylibs(MachOObjectFile *O, bool JustId) {
545 for (const auto &Load : O->load_commands()) {
546 if ((JustId && Load.C.cmd == MachO::LC_ID_DYLIB) ||
547 (!JustId && (Load.C.cmd == MachO::LC_ID_DYLIB ||
548 Load.C.cmd == MachO::LC_LOAD_DYLIB ||
549 Load.C.cmd == MachO::LC_LOAD_WEAK_DYLIB ||
550 Load.C.cmd == MachO::LC_REEXPORT_DYLIB ||
551 Load.C.cmd == MachO::LC_LAZY_LOAD_DYLIB ||
552 Load.C.cmd == MachO::LC_LOAD_UPWARD_DYLIB))) {
553 MachO::dylib_command dl = O->getDylibIDLoadCommand(Load);
554 if (dl.dylib.name < dl.cmdsize) {
555 const char *p = (const char *)(Load.Ptr) + dl.dylib.name;
560 outs() << " (compatibility version "
561 << ((dl.dylib.compatibility_version >> 16) & 0xffff) << "."
562 << ((dl.dylib.compatibility_version >> 8) & 0xff) << "."
563 << (dl.dylib.compatibility_version & 0xff) << ",";
564 outs() << " current version "
565 << ((dl.dylib.current_version >> 16) & 0xffff) << "."
566 << ((dl.dylib.current_version >> 8) & 0xff) << "."
567 << (dl.dylib.current_version & 0xff) << ")\n";
570 outs() << "\tBad offset (" << dl.dylib.name << ") for name of ";
571 if (Load.C.cmd == MachO::LC_ID_DYLIB)
572 outs() << "LC_ID_DYLIB ";
573 else if (Load.C.cmd == MachO::LC_LOAD_DYLIB)
574 outs() << "LC_LOAD_DYLIB ";
575 else if (Load.C.cmd == MachO::LC_LOAD_WEAK_DYLIB)
576 outs() << "LC_LOAD_WEAK_DYLIB ";
577 else if (Load.C.cmd == MachO::LC_LAZY_LOAD_DYLIB)
578 outs() << "LC_LAZY_LOAD_DYLIB ";
579 else if (Load.C.cmd == MachO::LC_REEXPORT_DYLIB)
580 outs() << "LC_REEXPORT_DYLIB ";
581 else if (Load.C.cmd == MachO::LC_LOAD_UPWARD_DYLIB)
582 outs() << "LC_LOAD_UPWARD_DYLIB ";
585 outs() << "command " << Index++ << "\n";
591 typedef DenseMap<uint64_t, StringRef> SymbolAddressMap;
593 static void CreateSymbolAddressMap(MachOObjectFile *O,
594 SymbolAddressMap *AddrMap) {
595 // Create a map of symbol addresses to symbol names.
596 for (const SymbolRef &Symbol : O->symbols()) {
597 Expected<SymbolRef::Type> STOrErr = Symbol.getType();
599 report_error(O->getFileName(), STOrErr.takeError());
600 SymbolRef::Type ST = *STOrErr;
601 if (ST == SymbolRef::ST_Function || ST == SymbolRef::ST_Data ||
602 ST == SymbolRef::ST_Other) {
603 uint64_t Address = Symbol.getValue();
604 Expected<StringRef> SymNameOrErr = Symbol.getName();
606 report_error(O->getFileName(), SymNameOrErr.takeError());
607 StringRef SymName = *SymNameOrErr;
608 if (!SymName.startswith(".objc"))
609 (*AddrMap)[Address] = SymName;
614 // GuessSymbolName is passed the address of what might be a symbol and a
615 // pointer to the SymbolAddressMap. It returns the name of a symbol
616 // with that address or nullptr if no symbol is found with that address.
617 static const char *GuessSymbolName(uint64_t value, SymbolAddressMap *AddrMap) {
618 const char *SymbolName = nullptr;
619 // A DenseMap can't lookup up some values.
620 if (value != 0xffffffffffffffffULL && value != 0xfffffffffffffffeULL) {
621 StringRef name = AddrMap->lookup(value);
623 SymbolName = name.data();
628 static void DumpCstringChar(const char c) {
632 outs().write_escaped(p);
635 static void DumpCstringSection(MachOObjectFile *O, const char *sect,
636 uint32_t sect_size, uint64_t sect_addr,
637 bool print_addresses) {
638 for (uint32_t i = 0; i < sect_size; i++) {
639 if (print_addresses) {
641 outs() << format("%016" PRIx64, sect_addr + i) << " ";
643 outs() << format("%08" PRIx64, sect_addr + i) << " ";
645 for (; i < sect_size && sect[i] != '\0'; i++)
646 DumpCstringChar(sect[i]);
647 if (i < sect_size && sect[i] == '\0')
652 static void DumpLiteral4(uint32_t l, float f) {
653 outs() << format("0x%08" PRIx32, l);
654 if ((l & 0x7f800000) != 0x7f800000)
655 outs() << format(" (%.16e)\n", f);
658 outs() << " (+Infinity)\n";
659 else if (l == 0xff800000)
660 outs() << " (-Infinity)\n";
661 else if ((l & 0x00400000) == 0x00400000)
662 outs() << " (non-signaling Not-a-Number)\n";
664 outs() << " (signaling Not-a-Number)\n";
668 static void DumpLiteral4Section(MachOObjectFile *O, const char *sect,
669 uint32_t sect_size, uint64_t sect_addr,
670 bool print_addresses) {
671 for (uint32_t i = 0; i < sect_size; i += sizeof(float)) {
672 if (print_addresses) {
674 outs() << format("%016" PRIx64, sect_addr + i) << " ";
676 outs() << format("%08" PRIx64, sect_addr + i) << " ";
679 memcpy(&f, sect + i, sizeof(float));
680 if (O->isLittleEndian() != sys::IsLittleEndianHost)
681 sys::swapByteOrder(f);
683 memcpy(&l, sect + i, sizeof(uint32_t));
684 if (O->isLittleEndian() != sys::IsLittleEndianHost)
685 sys::swapByteOrder(l);
690 static void DumpLiteral8(MachOObjectFile *O, uint32_t l0, uint32_t l1,
692 outs() << format("0x%08" PRIx32, l0) << " " << format("0x%08" PRIx32, l1);
694 Hi = (O->isLittleEndian()) ? l1 : l0;
695 Lo = (O->isLittleEndian()) ? l0 : l1;
697 // Hi is the high word, so this is equivalent to if(isfinite(d))
698 if ((Hi & 0x7ff00000) != 0x7ff00000)
699 outs() << format(" (%.16e)\n", d);
701 if (Hi == 0x7ff00000 && Lo == 0)
702 outs() << " (+Infinity)\n";
703 else if (Hi == 0xfff00000 && Lo == 0)
704 outs() << " (-Infinity)\n";
705 else if ((Hi & 0x00080000) == 0x00080000)
706 outs() << " (non-signaling Not-a-Number)\n";
708 outs() << " (signaling Not-a-Number)\n";
712 static void DumpLiteral8Section(MachOObjectFile *O, const char *sect,
713 uint32_t sect_size, uint64_t sect_addr,
714 bool print_addresses) {
715 for (uint32_t i = 0; i < sect_size; i += sizeof(double)) {
716 if (print_addresses) {
718 outs() << format("%016" PRIx64, sect_addr + i) << " ";
720 outs() << format("%08" PRIx64, sect_addr + i) << " ";
723 memcpy(&d, sect + i, sizeof(double));
724 if (O->isLittleEndian() != sys::IsLittleEndianHost)
725 sys::swapByteOrder(d);
727 memcpy(&l0, sect + i, sizeof(uint32_t));
728 memcpy(&l1, sect + i + sizeof(uint32_t), sizeof(uint32_t));
729 if (O->isLittleEndian() != sys::IsLittleEndianHost) {
730 sys::swapByteOrder(l0);
731 sys::swapByteOrder(l1);
733 DumpLiteral8(O, l0, l1, d);
737 static void DumpLiteral16(uint32_t l0, uint32_t l1, uint32_t l2, uint32_t l3) {
738 outs() << format("0x%08" PRIx32, l0) << " ";
739 outs() << format("0x%08" PRIx32, l1) << " ";
740 outs() << format("0x%08" PRIx32, l2) << " ";
741 outs() << format("0x%08" PRIx32, l3) << "\n";
744 static void DumpLiteral16Section(MachOObjectFile *O, const char *sect,
745 uint32_t sect_size, uint64_t sect_addr,
746 bool print_addresses) {
747 for (uint32_t i = 0; i < sect_size; i += 16) {
748 if (print_addresses) {
750 outs() << format("%016" PRIx64, sect_addr + i) << " ";
752 outs() << format("%08" PRIx64, sect_addr + i) << " ";
754 uint32_t l0, l1, l2, l3;
755 memcpy(&l0, sect + i, sizeof(uint32_t));
756 memcpy(&l1, sect + i + sizeof(uint32_t), sizeof(uint32_t));
757 memcpy(&l2, sect + i + 2 * sizeof(uint32_t), sizeof(uint32_t));
758 memcpy(&l3, sect + i + 3 * sizeof(uint32_t), sizeof(uint32_t));
759 if (O->isLittleEndian() != sys::IsLittleEndianHost) {
760 sys::swapByteOrder(l0);
761 sys::swapByteOrder(l1);
762 sys::swapByteOrder(l2);
763 sys::swapByteOrder(l3);
765 DumpLiteral16(l0, l1, l2, l3);
769 static void DumpLiteralPointerSection(MachOObjectFile *O,
770 const SectionRef &Section,
771 const char *sect, uint32_t sect_size,
773 bool print_addresses) {
774 // Collect the literal sections in this Mach-O file.
775 std::vector<SectionRef> LiteralSections;
776 for (const SectionRef &Section : O->sections()) {
777 DataRefImpl Ref = Section.getRawDataRefImpl();
778 uint32_t section_type;
780 const MachO::section_64 Sec = O->getSection64(Ref);
781 section_type = Sec.flags & MachO::SECTION_TYPE;
783 const MachO::section Sec = O->getSection(Ref);
784 section_type = Sec.flags & MachO::SECTION_TYPE;
786 if (section_type == MachO::S_CSTRING_LITERALS ||
787 section_type == MachO::S_4BYTE_LITERALS ||
788 section_type == MachO::S_8BYTE_LITERALS ||
789 section_type == MachO::S_16BYTE_LITERALS)
790 LiteralSections.push_back(Section);
793 // Set the size of the literal pointer.
794 uint32_t lp_size = O->is64Bit() ? 8 : 4;
796 // Collect the external relocation symbols for the literal pointers.
797 std::vector<std::pair<uint64_t, SymbolRef>> Relocs;
798 for (const RelocationRef &Reloc : Section.relocations()) {
800 MachO::any_relocation_info RE;
801 bool isExtern = false;
802 Rel = Reloc.getRawDataRefImpl();
803 RE = O->getRelocation(Rel);
804 isExtern = O->getPlainRelocationExternal(RE);
806 uint64_t RelocOffset = Reloc.getOffset();
807 symbol_iterator RelocSym = Reloc.getSymbol();
808 Relocs.push_back(std::make_pair(RelocOffset, *RelocSym));
811 array_pod_sort(Relocs.begin(), Relocs.end());
813 // Dump each literal pointer.
814 for (uint32_t i = 0; i < sect_size; i += lp_size) {
815 if (print_addresses) {
817 outs() << format("%016" PRIx64, sect_addr + i) << " ";
819 outs() << format("%08" PRIx64, sect_addr + i) << " ";
823 memcpy(&lp, sect + i, sizeof(uint64_t));
824 if (O->isLittleEndian() != sys::IsLittleEndianHost)
825 sys::swapByteOrder(lp);
828 memcpy(&li, sect + i, sizeof(uint32_t));
829 if (O->isLittleEndian() != sys::IsLittleEndianHost)
830 sys::swapByteOrder(li);
834 // First look for an external relocation entry for this literal pointer.
835 auto Reloc = find_if(Relocs, [&](const std::pair<uint64_t, SymbolRef> &P) {
838 if (Reloc != Relocs.end()) {
839 symbol_iterator RelocSym = Reloc->second;
840 Expected<StringRef> SymName = RelocSym->getName();
842 report_error(O->getFileName(), SymName.takeError());
843 outs() << "external relocation entry for symbol:" << *SymName << "\n";
847 // For local references see what the section the literal pointer points to.
848 auto Sect = find_if(LiteralSections, [&](const SectionRef &R) {
849 return lp >= R.getAddress() && lp < R.getAddress() + R.getSize();
851 if (Sect == LiteralSections.end()) {
852 outs() << format("0x%" PRIx64, lp) << " (not in a literal section)\n";
856 uint64_t SectAddress = Sect->getAddress();
857 uint64_t SectSize = Sect->getSize();
860 Sect->getName(SectName);
861 DataRefImpl Ref = Sect->getRawDataRefImpl();
862 StringRef SegmentName = O->getSectionFinalSegmentName(Ref);
863 outs() << SegmentName << ":" << SectName << ":";
865 uint32_t section_type;
867 const MachO::section_64 Sec = O->getSection64(Ref);
868 section_type = Sec.flags & MachO::SECTION_TYPE;
870 const MachO::section Sec = O->getSection(Ref);
871 section_type = Sec.flags & MachO::SECTION_TYPE;
875 Sect->getContents(BytesStr);
876 const char *Contents = reinterpret_cast<const char *>(BytesStr.data());
878 switch (section_type) {
879 case MachO::S_CSTRING_LITERALS:
880 for (uint64_t i = lp - SectAddress; i < SectSize && Contents[i] != '\0';
882 DumpCstringChar(Contents[i]);
886 case MachO::S_4BYTE_LITERALS:
888 memcpy(&f, Contents + (lp - SectAddress), sizeof(float));
890 memcpy(&l, Contents + (lp - SectAddress), sizeof(uint32_t));
891 if (O->isLittleEndian() != sys::IsLittleEndianHost) {
892 sys::swapByteOrder(f);
893 sys::swapByteOrder(l);
897 case MachO::S_8BYTE_LITERALS: {
899 memcpy(&d, Contents + (lp - SectAddress), sizeof(double));
901 memcpy(&l0, Contents + (lp - SectAddress), sizeof(uint32_t));
902 memcpy(&l1, Contents + (lp - SectAddress) + sizeof(uint32_t),
904 if (O->isLittleEndian() != sys::IsLittleEndianHost) {
905 sys::swapByteOrder(f);
906 sys::swapByteOrder(l0);
907 sys::swapByteOrder(l1);
909 DumpLiteral8(O, l0, l1, d);
912 case MachO::S_16BYTE_LITERALS: {
913 uint32_t l0, l1, l2, l3;
914 memcpy(&l0, Contents + (lp - SectAddress), sizeof(uint32_t));
915 memcpy(&l1, Contents + (lp - SectAddress) + sizeof(uint32_t),
917 memcpy(&l2, Contents + (lp - SectAddress) + 2 * sizeof(uint32_t),
919 memcpy(&l3, Contents + (lp - SectAddress) + 3 * sizeof(uint32_t),
921 if (O->isLittleEndian() != sys::IsLittleEndianHost) {
922 sys::swapByteOrder(l0);
923 sys::swapByteOrder(l1);
924 sys::swapByteOrder(l2);
925 sys::swapByteOrder(l3);
927 DumpLiteral16(l0, l1, l2, l3);
934 static void DumpInitTermPointerSection(MachOObjectFile *O, const char *sect,
935 uint32_t sect_size, uint64_t sect_addr,
936 SymbolAddressMap *AddrMap,
939 stride = (O->is64Bit()) ? sizeof(uint64_t) : sizeof(uint32_t);
940 for (uint32_t i = 0; i < sect_size; i += stride) {
941 const char *SymbolName = nullptr;
943 outs() << format("0x%016" PRIx64, sect_addr + i * stride) << " ";
944 uint64_t pointer_value;
945 memcpy(&pointer_value, sect + i, stride);
946 if (O->isLittleEndian() != sys::IsLittleEndianHost)
947 sys::swapByteOrder(pointer_value);
948 outs() << format("0x%016" PRIx64, pointer_value);
950 SymbolName = GuessSymbolName(pointer_value, AddrMap);
952 outs() << format("0x%08" PRIx64, sect_addr + i * stride) << " ";
953 uint32_t pointer_value;
954 memcpy(&pointer_value, sect + i, stride);
955 if (O->isLittleEndian() != sys::IsLittleEndianHost)
956 sys::swapByteOrder(pointer_value);
957 outs() << format("0x%08" PRIx32, pointer_value);
959 SymbolName = GuessSymbolName(pointer_value, AddrMap);
962 outs() << " " << SymbolName;
967 static void DumpRawSectionContents(MachOObjectFile *O, const char *sect,
968 uint32_t size, uint64_t addr) {
969 uint32_t cputype = O->getHeader().cputype;
970 if (cputype == MachO::CPU_TYPE_I386 || cputype == MachO::CPU_TYPE_X86_64) {
972 for (uint32_t i = 0; i < size; i += j, addr += j) {
974 outs() << format("%016" PRIx64, addr) << "\t";
976 outs() << format("%08" PRIx64, addr) << "\t";
977 for (j = 0; j < 16 && i + j < size; j++) {
978 uint8_t byte_word = *(sect + i + j);
979 outs() << format("%02" PRIx32, (uint32_t)byte_word) << " ";
985 for (uint32_t i = 0; i < size; i += j, addr += j) {
987 outs() << format("%016" PRIx64, addr) << "\t";
989 outs() << format("%08" PRIx64, addr) << "\t";
990 for (j = 0; j < 4 * sizeof(int32_t) && i + j < size;
991 j += sizeof(int32_t)) {
992 if (i + j + sizeof(int32_t) <= size) {
994 memcpy(&long_word, sect + i + j, sizeof(int32_t));
995 if (O->isLittleEndian() != sys::IsLittleEndianHost)
996 sys::swapByteOrder(long_word);
997 outs() << format("%08" PRIx32, long_word) << " ";
999 for (uint32_t k = 0; i + j + k < size; k++) {
1000 uint8_t byte_word = *(sect + i + j + k);
1001 outs() << format("%02" PRIx32, (uint32_t)byte_word) << " ";
1010 static void DisassembleMachO(StringRef Filename, MachOObjectFile *MachOOF,
1011 StringRef DisSegName, StringRef DisSectName);
1012 static void DumpProtocolSection(MachOObjectFile *O, const char *sect,
1013 uint32_t size, uint32_t addr);
1015 static void DumpBitcodeSection(MachOObjectFile *O, const char *sect,
1016 uint32_t size, bool verbose,
1017 bool PrintXarHeader, bool PrintXarFileHeaders,
1018 std::string XarMemberName);
1019 #endif // defined(HAVE_LIBXAR)
1021 static void DumpSectionContents(StringRef Filename, MachOObjectFile *O,
1023 SymbolAddressMap AddrMap;
1025 CreateSymbolAddressMap(O, &AddrMap);
1027 for (unsigned i = 0; i < FilterSections.size(); ++i) {
1028 StringRef DumpSection = FilterSections[i];
1029 std::pair<StringRef, StringRef> DumpSegSectName;
1030 DumpSegSectName = DumpSection.split(',');
1031 StringRef DumpSegName, DumpSectName;
1032 if (DumpSegSectName.second.size()) {
1033 DumpSegName = DumpSegSectName.first;
1034 DumpSectName = DumpSegSectName.second;
1037 DumpSectName = DumpSegSectName.first;
1039 for (const SectionRef &Section : O->sections()) {
1041 Section.getName(SectName);
1042 DataRefImpl Ref = Section.getRawDataRefImpl();
1043 StringRef SegName = O->getSectionFinalSegmentName(Ref);
1044 if ((DumpSegName.empty() || SegName == DumpSegName) &&
1045 (SectName == DumpSectName)) {
1047 uint32_t section_flags;
1049 const MachO::section_64 Sec = O->getSection64(Ref);
1050 section_flags = Sec.flags;
1053 const MachO::section Sec = O->getSection(Ref);
1054 section_flags = Sec.flags;
1056 uint32_t section_type = section_flags & MachO::SECTION_TYPE;
1059 Section.getContents(BytesStr);
1060 const char *sect = reinterpret_cast<const char *>(BytesStr.data());
1061 uint32_t sect_size = BytesStr.size();
1062 uint64_t sect_addr = Section.getAddress();
1064 outs() << "Contents of (" << SegName << "," << SectName
1068 if ((section_flags & MachO::S_ATTR_PURE_INSTRUCTIONS) ||
1069 (section_flags & MachO::S_ATTR_SOME_INSTRUCTIONS)) {
1070 DisassembleMachO(Filename, O, SegName, SectName);
1073 if (SegName == "__TEXT" && SectName == "__info_plist") {
1077 if (SegName == "__OBJC" && SectName == "__protocol") {
1078 DumpProtocolSection(O, sect, sect_size, sect_addr);
1082 if (SegName == "__LLVM" && SectName == "__bundle") {
1083 DumpBitcodeSection(O, sect, sect_size, verbose, !NoSymbolicOperands,
1084 ArchiveHeaders, "");
1087 #endif // defined(HAVE_LIBXAR)
1088 switch (section_type) {
1089 case MachO::S_REGULAR:
1090 DumpRawSectionContents(O, sect, sect_size, sect_addr);
1092 case MachO::S_ZEROFILL:
1093 outs() << "zerofill section and has no contents in the file\n";
1095 case MachO::S_CSTRING_LITERALS:
1096 DumpCstringSection(O, sect, sect_size, sect_addr, !NoLeadingAddr);
1098 case MachO::S_4BYTE_LITERALS:
1099 DumpLiteral4Section(O, sect, sect_size, sect_addr, !NoLeadingAddr);
1101 case MachO::S_8BYTE_LITERALS:
1102 DumpLiteral8Section(O, sect, sect_size, sect_addr, !NoLeadingAddr);
1104 case MachO::S_16BYTE_LITERALS:
1105 DumpLiteral16Section(O, sect, sect_size, sect_addr, !NoLeadingAddr);
1107 case MachO::S_LITERAL_POINTERS:
1108 DumpLiteralPointerSection(O, Section, sect, sect_size, sect_addr,
1111 case MachO::S_MOD_INIT_FUNC_POINTERS:
1112 case MachO::S_MOD_TERM_FUNC_POINTERS:
1113 DumpInitTermPointerSection(O, sect, sect_size, sect_addr, &AddrMap,
1117 outs() << "Unknown section type ("
1118 << format("0x%08" PRIx32, section_type) << ")\n";
1119 DumpRawSectionContents(O, sect, sect_size, sect_addr);
1123 if (section_type == MachO::S_ZEROFILL)
1124 outs() << "zerofill section and has no contents in the file\n";
1126 DumpRawSectionContents(O, sect, sect_size, sect_addr);
1133 static void DumpInfoPlistSectionContents(StringRef Filename,
1134 MachOObjectFile *O) {
1135 for (const SectionRef &Section : O->sections()) {
1137 Section.getName(SectName);
1138 DataRefImpl Ref = Section.getRawDataRefImpl();
1139 StringRef SegName = O->getSectionFinalSegmentName(Ref);
1140 if (SegName == "__TEXT" && SectName == "__info_plist") {
1141 outs() << "Contents of (" << SegName << "," << SectName << ") section\n";
1143 Section.getContents(BytesStr);
1144 const char *sect = reinterpret_cast<const char *>(BytesStr.data());
1151 // checkMachOAndArchFlags() checks to see if the ObjectFile is a Mach-O file
1152 // and if it is and there is a list of architecture flags is specified then
1153 // check to make sure this Mach-O file is one of those architectures or all
1154 // architectures were specified. If not then an error is generated and this
1155 // routine returns false. Else it returns true.
1156 static bool checkMachOAndArchFlags(ObjectFile *O, StringRef Filename) {
1157 auto *MachO = dyn_cast<MachOObjectFile>(O);
1159 if (!MachO || ArchAll || ArchFlags.empty())
1162 MachO::mach_header H;
1163 MachO::mach_header_64 H_64;
1165 const char *McpuDefault, *ArchFlag;
1166 if (MachO->is64Bit()) {
1167 H_64 = MachO->MachOObjectFile::getHeader64();
1168 T = MachOObjectFile::getArchTriple(H_64.cputype, H_64.cpusubtype,
1169 &McpuDefault, &ArchFlag);
1171 H = MachO->MachOObjectFile::getHeader();
1172 T = MachOObjectFile::getArchTriple(H.cputype, H.cpusubtype,
1173 &McpuDefault, &ArchFlag);
1175 const std::string ArchFlagName(ArchFlag);
1176 if (none_of(ArchFlags, [&](const std::string &Name) {
1177 return Name == ArchFlagName;
1179 errs() << "llvm-objdump: " + Filename + ": No architecture specified.\n";
1185 static void printObjcMetaData(MachOObjectFile *O, bool verbose);
1187 // ProcessMachO() is passed a single opened Mach-O file, which may be an
1188 // archive member and or in a slice of a universal file. It prints the
1189 // the file name and header info and then processes it according to the
1190 // command line options.
1191 static void ProcessMachO(StringRef Name, MachOObjectFile *MachOOF,
1192 StringRef ArchiveMemberName = StringRef(),
1193 StringRef ArchitectureName = StringRef()) {
1194 // If we are doing some processing here on the Mach-O file print the header
1195 // info. And don't print it otherwise like in the case of printing the
1196 // UniversalHeaders or ArchiveHeaders.
1197 if (Disassemble || PrivateHeaders || ExportsTrie || Rebase || Bind || SymbolTable ||
1198 LazyBind || WeakBind || IndirectSymbols || DataInCode || LinkOptHints ||
1199 DylibsUsed || DylibId || ObjcMetaData || (FilterSections.size() != 0)) {
1200 if (!NoLeadingHeaders) {
1202 if (!ArchiveMemberName.empty())
1203 outs() << '(' << ArchiveMemberName << ')';
1204 if (!ArchitectureName.empty())
1205 outs() << " (architecture " << ArchitectureName << ")";
1209 // To use the report_error() form with an ArchiveName and FileName set
1210 // these up based on what is passed for Name and ArchiveMemberName.
1211 StringRef ArchiveName;
1213 if (!ArchiveMemberName.empty()) {
1215 FileName = ArchiveMemberName;
1217 ArchiveName = StringRef();
1221 // If we need the symbol table to do the operation then check it here to
1222 // produce a good error message as to where the Mach-O file comes from in
1223 // the error message.
1224 if (Disassemble || IndirectSymbols || FilterSections.size() != 0 ||
1226 if (Error Err = MachOOF->checkSymbolTable())
1227 report_error(ArchiveName, FileName, std::move(Err), ArchitectureName);
1230 DisassembleMachO(FileName, MachOOF, "__TEXT", "__text");
1231 if (IndirectSymbols)
1232 PrintIndirectSymbols(MachOOF, !NonVerbose);
1234 PrintDataInCodeTable(MachOOF, !NonVerbose);
1236 PrintLinkOptHints(MachOOF);
1238 PrintRelocations(MachOOF);
1240 PrintSectionHeaders(MachOOF);
1241 if (SectionContents)
1242 PrintSectionContents(MachOOF);
1243 if (FilterSections.size() != 0)
1244 DumpSectionContents(FileName, MachOOF, !NonVerbose);
1246 DumpInfoPlistSectionContents(FileName, MachOOF);
1248 PrintDylibs(MachOOF, false);
1250 PrintDylibs(MachOOF, true);
1252 PrintSymbolTable(MachOOF, ArchiveName, ArchitectureName);
1254 printMachOUnwindInfo(MachOOF);
1255 if (PrivateHeaders) {
1256 printMachOFileHeader(MachOOF);
1257 printMachOLoadCommands(MachOOF);
1259 if (FirstPrivateHeader)
1260 printMachOFileHeader(MachOOF);
1262 printObjcMetaData(MachOOF, !NonVerbose);
1264 printExportsTrie(MachOOF);
1266 printRebaseTable(MachOOF);
1268 printBindTable(MachOOF);
1270 printLazyBindTable(MachOOF);
1272 printWeakBindTable(MachOOF);
1274 if (DwarfDumpType != DIDT_Null) {
1275 std::unique_ptr<DIContext> DICtx(new DWARFContextInMemory(*MachOOF));
1276 // Dump the complete DWARF structure.
1277 DICtx->dump(outs(), DwarfDumpType, true /* DumpEH */);
1281 // printUnknownCPUType() helps print_fat_headers for unknown CPU's.
1282 static void printUnknownCPUType(uint32_t cputype, uint32_t cpusubtype) {
1283 outs() << " cputype (" << cputype << ")\n";
1284 outs() << " cpusubtype (" << cpusubtype << ")\n";
1287 // printCPUType() helps print_fat_headers by printing the cputype and
1288 // pusubtype (symbolically for the one's it knows about).
1289 static void printCPUType(uint32_t cputype, uint32_t cpusubtype) {
1291 case MachO::CPU_TYPE_I386:
1292 switch (cpusubtype) {
1293 case MachO::CPU_SUBTYPE_I386_ALL:
1294 outs() << " cputype CPU_TYPE_I386\n";
1295 outs() << " cpusubtype CPU_SUBTYPE_I386_ALL\n";
1298 printUnknownCPUType(cputype, cpusubtype);
1302 case MachO::CPU_TYPE_X86_64:
1303 switch (cpusubtype) {
1304 case MachO::CPU_SUBTYPE_X86_64_ALL:
1305 outs() << " cputype CPU_TYPE_X86_64\n";
1306 outs() << " cpusubtype CPU_SUBTYPE_X86_64_ALL\n";
1308 case MachO::CPU_SUBTYPE_X86_64_H:
1309 outs() << " cputype CPU_TYPE_X86_64\n";
1310 outs() << " cpusubtype CPU_SUBTYPE_X86_64_H\n";
1313 printUnknownCPUType(cputype, cpusubtype);
1317 case MachO::CPU_TYPE_ARM:
1318 switch (cpusubtype) {
1319 case MachO::CPU_SUBTYPE_ARM_ALL:
1320 outs() << " cputype CPU_TYPE_ARM\n";
1321 outs() << " cpusubtype CPU_SUBTYPE_ARM_ALL\n";
1323 case MachO::CPU_SUBTYPE_ARM_V4T:
1324 outs() << " cputype CPU_TYPE_ARM\n";
1325 outs() << " cpusubtype CPU_SUBTYPE_ARM_V4T\n";
1327 case MachO::CPU_SUBTYPE_ARM_V5TEJ:
1328 outs() << " cputype CPU_TYPE_ARM\n";
1329 outs() << " cpusubtype CPU_SUBTYPE_ARM_V5TEJ\n";
1331 case MachO::CPU_SUBTYPE_ARM_XSCALE:
1332 outs() << " cputype CPU_TYPE_ARM\n";
1333 outs() << " cpusubtype CPU_SUBTYPE_ARM_XSCALE\n";
1335 case MachO::CPU_SUBTYPE_ARM_V6:
1336 outs() << " cputype CPU_TYPE_ARM\n";
1337 outs() << " cpusubtype CPU_SUBTYPE_ARM_V6\n";
1339 case MachO::CPU_SUBTYPE_ARM_V6M:
1340 outs() << " cputype CPU_TYPE_ARM\n";
1341 outs() << " cpusubtype CPU_SUBTYPE_ARM_V6M\n";
1343 case MachO::CPU_SUBTYPE_ARM_V7:
1344 outs() << " cputype CPU_TYPE_ARM\n";
1345 outs() << " cpusubtype CPU_SUBTYPE_ARM_V7\n";
1347 case MachO::CPU_SUBTYPE_ARM_V7EM:
1348 outs() << " cputype CPU_TYPE_ARM\n";
1349 outs() << " cpusubtype CPU_SUBTYPE_ARM_V7EM\n";
1351 case MachO::CPU_SUBTYPE_ARM_V7K:
1352 outs() << " cputype CPU_TYPE_ARM\n";
1353 outs() << " cpusubtype CPU_SUBTYPE_ARM_V7K\n";
1355 case MachO::CPU_SUBTYPE_ARM_V7M:
1356 outs() << " cputype CPU_TYPE_ARM\n";
1357 outs() << " cpusubtype CPU_SUBTYPE_ARM_V7M\n";
1359 case MachO::CPU_SUBTYPE_ARM_V7S:
1360 outs() << " cputype CPU_TYPE_ARM\n";
1361 outs() << " cpusubtype CPU_SUBTYPE_ARM_V7S\n";
1364 printUnknownCPUType(cputype, cpusubtype);
1368 case MachO::CPU_TYPE_ARM64:
1369 switch (cpusubtype & ~MachO::CPU_SUBTYPE_MASK) {
1370 case MachO::CPU_SUBTYPE_ARM64_ALL:
1371 outs() << " cputype CPU_TYPE_ARM64\n";
1372 outs() << " cpusubtype CPU_SUBTYPE_ARM64_ALL\n";
1375 printUnknownCPUType(cputype, cpusubtype);
1380 printUnknownCPUType(cputype, cpusubtype);
1385 static void printMachOUniversalHeaders(const object::MachOUniversalBinary *UB,
1387 outs() << "Fat headers\n";
1389 if (UB->getMagic() == MachO::FAT_MAGIC)
1390 outs() << "fat_magic FAT_MAGIC\n";
1391 else // UB->getMagic() == MachO::FAT_MAGIC_64
1392 outs() << "fat_magic FAT_MAGIC_64\n";
1394 outs() << "fat_magic " << format("0x%" PRIx32, MachO::FAT_MAGIC) << "\n";
1396 uint32_t nfat_arch = UB->getNumberOfObjects();
1397 StringRef Buf = UB->getData();
1398 uint64_t size = Buf.size();
1399 uint64_t big_size = sizeof(struct MachO::fat_header) +
1400 nfat_arch * sizeof(struct MachO::fat_arch);
1401 outs() << "nfat_arch " << UB->getNumberOfObjects();
1403 outs() << " (malformed, contains zero architecture types)\n";
1404 else if (big_size > size)
1405 outs() << " (malformed, architectures past end of file)\n";
1409 for (uint32_t i = 0; i < nfat_arch; ++i) {
1410 MachOUniversalBinary::ObjectForArch OFA(UB, i);
1411 uint32_t cputype = OFA.getCPUType();
1412 uint32_t cpusubtype = OFA.getCPUSubType();
1413 outs() << "architecture ";
1414 for (uint32_t j = 0; i != 0 && j <= i - 1; j++) {
1415 MachOUniversalBinary::ObjectForArch other_OFA(UB, j);
1416 uint32_t other_cputype = other_OFA.getCPUType();
1417 uint32_t other_cpusubtype = other_OFA.getCPUSubType();
1418 if (cputype != 0 && cpusubtype != 0 && cputype == other_cputype &&
1419 (cpusubtype & ~MachO::CPU_SUBTYPE_MASK) ==
1420 (other_cpusubtype & ~MachO::CPU_SUBTYPE_MASK)) {
1421 outs() << "(illegal duplicate architecture) ";
1426 outs() << OFA.getArchFlagName() << "\n";
1427 printCPUType(cputype, cpusubtype & ~MachO::CPU_SUBTYPE_MASK);
1429 outs() << i << "\n";
1430 outs() << " cputype " << cputype << "\n";
1431 outs() << " cpusubtype " << (cpusubtype & ~MachO::CPU_SUBTYPE_MASK)
1435 (cpusubtype & MachO::CPU_SUBTYPE_MASK) == MachO::CPU_SUBTYPE_LIB64)
1436 outs() << " capabilities CPU_SUBTYPE_LIB64\n";
1438 outs() << " capabilities "
1439 << format("0x%" PRIx32,
1440 (cpusubtype & MachO::CPU_SUBTYPE_MASK) >> 24) << "\n";
1441 outs() << " offset " << OFA.getOffset();
1442 if (OFA.getOffset() > size)
1443 outs() << " (past end of file)";
1444 if (OFA.getOffset() % (1 << OFA.getAlign()) != 0)
1445 outs() << " (not aligned on it's alignment (2^" << OFA.getAlign() << ")";
1447 outs() << " size " << OFA.getSize();
1448 big_size = OFA.getOffset() + OFA.getSize();
1449 if (big_size > size)
1450 outs() << " (past end of file)";
1452 outs() << " align 2^" << OFA.getAlign() << " (" << (1 << OFA.getAlign())
1457 static void printArchiveChild(StringRef Filename, const Archive::Child &C,
1458 bool verbose, bool print_offset,
1459 StringRef ArchitectureName = StringRef()) {
1461 outs() << C.getChildOffset() << "\t";
1462 Expected<sys::fs::perms> ModeOrErr = C.getAccessMode();
1464 report_error(Filename, C, ModeOrErr.takeError(), ArchitectureName);
1465 sys::fs::perms Mode = ModeOrErr.get();
1467 // FIXME: this first dash, "-", is for (Mode & S_IFMT) == S_IFREG.
1468 // But there is nothing in sys::fs::perms for S_IFMT or S_IFREG.
1470 outs() << ((Mode & sys::fs::owner_read) ? "r" : "-");
1471 outs() << ((Mode & sys::fs::owner_write) ? "w" : "-");
1472 outs() << ((Mode & sys::fs::owner_exe) ? "x" : "-");
1473 outs() << ((Mode & sys::fs::group_read) ? "r" : "-");
1474 outs() << ((Mode & sys::fs::group_write) ? "w" : "-");
1475 outs() << ((Mode & sys::fs::group_exe) ? "x" : "-");
1476 outs() << ((Mode & sys::fs::others_read) ? "r" : "-");
1477 outs() << ((Mode & sys::fs::others_write) ? "w" : "-");
1478 outs() << ((Mode & sys::fs::others_exe) ? "x" : "-");
1480 outs() << format("0%o ", Mode);
1483 Expected<unsigned> UIDOrErr = C.getUID();
1485 report_error(Filename, C, UIDOrErr.takeError(), ArchitectureName);
1486 unsigned UID = UIDOrErr.get();
1487 outs() << format("%3d/", UID);
1488 Expected<unsigned> GIDOrErr = C.getGID();
1490 report_error(Filename, C, GIDOrErr.takeError(), ArchitectureName);
1491 unsigned GID = GIDOrErr.get();
1492 outs() << format("%-3d ", GID);
1493 Expected<uint64_t> Size = C.getRawSize();
1495 report_error(Filename, C, Size.takeError(), ArchitectureName);
1496 outs() << format("%5" PRId64, Size.get()) << " ";
1498 StringRef RawLastModified = C.getRawLastModified();
1501 if (RawLastModified.getAsInteger(10, Seconds))
1502 outs() << "(date: \"" << RawLastModified
1503 << "\" contains non-decimal chars) ";
1505 // Since cime(3) returns a 26 character string of the form:
1506 // "Sun Sep 16 01:03:52 1973\n\0"
1507 // just print 24 characters.
1509 outs() << format("%.24s ", ctime(&t));
1512 outs() << RawLastModified << " ";
1516 Expected<StringRef> NameOrErr = C.getName();
1518 consumeError(NameOrErr.takeError());
1519 Expected<StringRef> NameOrErr = C.getRawName();
1521 report_error(Filename, C, NameOrErr.takeError(), ArchitectureName);
1522 StringRef RawName = NameOrErr.get();
1523 outs() << RawName << "\n";
1525 StringRef Name = NameOrErr.get();
1526 outs() << Name << "\n";
1529 Expected<StringRef> NameOrErr = C.getRawName();
1531 report_error(Filename, C, NameOrErr.takeError(), ArchitectureName);
1532 StringRef RawName = NameOrErr.get();
1533 outs() << RawName << "\n";
1537 static void printArchiveHeaders(StringRef Filename, Archive *A, bool verbose,
1539 StringRef ArchitectureName = StringRef()) {
1540 Error Err = Error::success();
1542 for (const auto &C : A->children(Err, false))
1543 printArchiveChild(Filename, C, verbose, print_offset, ArchitectureName);
1546 report_error(StringRef(), Filename, std::move(Err), ArchitectureName);
1549 // ParseInputMachO() parses the named Mach-O file in Filename and handles the
1550 // -arch flags selecting just those slices as specified by them and also parses
1551 // archive files. Then for each individual Mach-O file ProcessMachO() is
1552 // called to process the file based on the command line options.
1553 void llvm::ParseInputMachO(StringRef Filename) {
1554 // Check for -arch all and verifiy the -arch flags are valid.
1555 for (unsigned i = 0; i < ArchFlags.size(); ++i) {
1556 if (ArchFlags[i] == "all") {
1559 if (!MachOObjectFile::isValidArch(ArchFlags[i])) {
1560 errs() << "llvm-objdump: Unknown architecture named '" + ArchFlags[i] +
1561 "'for the -arch option\n";
1567 // Attempt to open the binary.
1568 Expected<OwningBinary<Binary>> BinaryOrErr = createBinary(Filename);
1570 report_error(Filename, BinaryOrErr.takeError());
1571 Binary &Bin = *BinaryOrErr.get().getBinary();
1573 if (Archive *A = dyn_cast<Archive>(&Bin)) {
1574 outs() << "Archive : " << Filename << "\n";
1576 printArchiveHeaders(Filename, A, !NonVerbose, ArchiveMemberOffsets);
1578 Error Err = Error::success();
1579 for (auto &C : A->children(Err)) {
1580 Expected<std::unique_ptr<Binary>> ChildOrErr = C.getAsBinary();
1582 if (auto E = isNotObjectErrorInvalidFileType(ChildOrErr.takeError()))
1583 report_error(Filename, C, std::move(E));
1586 if (MachOObjectFile *O = dyn_cast<MachOObjectFile>(&*ChildOrErr.get())) {
1587 if (!checkMachOAndArchFlags(O, Filename))
1589 ProcessMachO(Filename, O, O->getFileName());
1593 report_error(Filename, std::move(Err));
1596 if (UniversalHeaders) {
1597 if (MachOUniversalBinary *UB = dyn_cast<MachOUniversalBinary>(&Bin))
1598 printMachOUniversalHeaders(UB, !NonVerbose);
1600 if (MachOUniversalBinary *UB = dyn_cast<MachOUniversalBinary>(&Bin)) {
1601 // If we have a list of architecture flags specified dump only those.
1602 if (!ArchAll && ArchFlags.size() != 0) {
1603 // Look for a slice in the universal binary that matches each ArchFlag.
1605 for (unsigned i = 0; i < ArchFlags.size(); ++i) {
1607 for (MachOUniversalBinary::object_iterator I = UB->begin_objects(),
1608 E = UB->end_objects();
1610 if (ArchFlags[i] == I->getArchFlagName()) {
1612 Expected<std::unique_ptr<ObjectFile>> ObjOrErr =
1613 I->getAsObjectFile();
1614 std::string ArchitectureName = "";
1615 if (ArchFlags.size() > 1)
1616 ArchitectureName = I->getArchFlagName();
1618 ObjectFile &O = *ObjOrErr.get();
1619 if (MachOObjectFile *MachOOF = dyn_cast<MachOObjectFile>(&O))
1620 ProcessMachO(Filename, MachOOF, "", ArchitectureName);
1621 } else if (auto E = isNotObjectErrorInvalidFileType(
1622 ObjOrErr.takeError())) {
1623 report_error(Filename, StringRef(), std::move(E),
1626 } else if (Expected<std::unique_ptr<Archive>> AOrErr =
1627 I->getAsArchive()) {
1628 std::unique_ptr<Archive> &A = *AOrErr;
1629 outs() << "Archive : " << Filename;
1630 if (!ArchitectureName.empty())
1631 outs() << " (architecture " << ArchitectureName << ")";
1634 printArchiveHeaders(Filename, A.get(), !NonVerbose,
1635 ArchiveMemberOffsets, ArchitectureName);
1636 Error Err = Error::success();
1637 for (auto &C : A->children(Err)) {
1638 Expected<std::unique_ptr<Binary>> ChildOrErr = C.getAsBinary();
1640 if (auto E = isNotObjectErrorInvalidFileType(ChildOrErr.takeError()))
1641 report_error(Filename, C, std::move(E), ArchitectureName);
1644 if (MachOObjectFile *O =
1645 dyn_cast<MachOObjectFile>(&*ChildOrErr.get()))
1646 ProcessMachO(Filename, O, O->getFileName(), ArchitectureName);
1649 report_error(Filename, std::move(Err));
1651 consumeError(AOrErr.takeError());
1652 error("Mach-O universal file: " + Filename + " for " +
1653 "architecture " + StringRef(I->getArchFlagName()) +
1654 " is not a Mach-O file or an archive file");
1659 errs() << "llvm-objdump: file: " + Filename + " does not contain "
1660 << "architecture: " + ArchFlags[i] + "\n";
1666 // No architecture flags were specified so if this contains a slice that
1667 // matches the host architecture dump only that.
1669 for (MachOUniversalBinary::object_iterator I = UB->begin_objects(),
1670 E = UB->end_objects();
1672 if (MachOObjectFile::getHostArch().getArchName() ==
1673 I->getArchFlagName()) {
1674 Expected<std::unique_ptr<ObjectFile>> ObjOrErr = I->getAsObjectFile();
1675 std::string ArchiveName;
1676 ArchiveName.clear();
1678 ObjectFile &O = *ObjOrErr.get();
1679 if (MachOObjectFile *MachOOF = dyn_cast<MachOObjectFile>(&O))
1680 ProcessMachO(Filename, MachOOF);
1681 } else if (auto E = isNotObjectErrorInvalidFileType(
1682 ObjOrErr.takeError())) {
1683 report_error(Filename, std::move(E));
1685 } else if (Expected<std::unique_ptr<Archive>> AOrErr =
1686 I->getAsArchive()) {
1687 std::unique_ptr<Archive> &A = *AOrErr;
1688 outs() << "Archive : " << Filename << "\n";
1690 printArchiveHeaders(Filename, A.get(), !NonVerbose,
1691 ArchiveMemberOffsets);
1692 Error Err = Error::success();
1693 for (auto &C : A->children(Err)) {
1694 Expected<std::unique_ptr<Binary>> ChildOrErr = C.getAsBinary();
1696 if (auto E = isNotObjectErrorInvalidFileType(ChildOrErr.takeError()))
1697 report_error(Filename, C, std::move(E));
1700 if (MachOObjectFile *O =
1701 dyn_cast<MachOObjectFile>(&*ChildOrErr.get()))
1702 ProcessMachO(Filename, O, O->getFileName());
1705 report_error(Filename, std::move(Err));
1707 consumeError(AOrErr.takeError());
1708 error("Mach-O universal file: " + Filename + " for architecture " +
1709 StringRef(I->getArchFlagName()) +
1710 " is not a Mach-O file or an archive file");
1716 // Either all architectures have been specified or none have been specified
1717 // and this does not contain the host architecture so dump all the slices.
1718 bool moreThanOneArch = UB->getNumberOfObjects() > 1;
1719 for (MachOUniversalBinary::object_iterator I = UB->begin_objects(),
1720 E = UB->end_objects();
1722 Expected<std::unique_ptr<ObjectFile>> ObjOrErr = I->getAsObjectFile();
1723 std::string ArchitectureName = "";
1724 if (moreThanOneArch)
1725 ArchitectureName = I->getArchFlagName();
1727 ObjectFile &Obj = *ObjOrErr.get();
1728 if (MachOObjectFile *MachOOF = dyn_cast<MachOObjectFile>(&Obj))
1729 ProcessMachO(Filename, MachOOF, "", ArchitectureName);
1730 } else if (auto E = isNotObjectErrorInvalidFileType(
1731 ObjOrErr.takeError())) {
1732 report_error(StringRef(), Filename, std::move(E), ArchitectureName);
1734 } else if (Expected<std::unique_ptr<Archive>> AOrErr =
1735 I->getAsArchive()) {
1736 std::unique_ptr<Archive> &A = *AOrErr;
1737 outs() << "Archive : " << Filename;
1738 if (!ArchitectureName.empty())
1739 outs() << " (architecture " << ArchitectureName << ")";
1742 printArchiveHeaders(Filename, A.get(), !NonVerbose,
1743 ArchiveMemberOffsets, ArchitectureName);
1744 Error Err = Error::success();
1745 for (auto &C : A->children(Err)) {
1746 Expected<std::unique_ptr<Binary>> ChildOrErr = C.getAsBinary();
1748 if (auto E = isNotObjectErrorInvalidFileType(ChildOrErr.takeError()))
1749 report_error(Filename, C, std::move(E), ArchitectureName);
1752 if (MachOObjectFile *O =
1753 dyn_cast<MachOObjectFile>(&*ChildOrErr.get())) {
1754 if (MachOObjectFile *MachOOF = dyn_cast<MachOObjectFile>(O))
1755 ProcessMachO(Filename, MachOOF, MachOOF->getFileName(),
1760 report_error(Filename, std::move(Err));
1762 consumeError(AOrErr.takeError());
1763 error("Mach-O universal file: " + Filename + " for architecture " +
1764 StringRef(I->getArchFlagName()) +
1765 " is not a Mach-O file or an archive file");
1770 if (ObjectFile *O = dyn_cast<ObjectFile>(&Bin)) {
1771 if (!checkMachOAndArchFlags(O, Filename))
1773 if (MachOObjectFile *MachOOF = dyn_cast<MachOObjectFile>(&*O)) {
1774 ProcessMachO(Filename, MachOOF);
1776 errs() << "llvm-objdump: '" << Filename << "': "
1777 << "Object is not a Mach-O file type.\n";
1780 llvm_unreachable("Input object can't be invalid at this point");
1783 // The block of info used by the Symbolizer call backs.
1784 struct DisassembleInfo {
1788 SymbolAddressMap *AddrMap;
1789 std::vector<SectionRef> *Sections;
1790 const char *class_name;
1791 const char *selector_name;
1793 char *demangled_name;
1796 std::unique_ptr<SymbolAddressMap> bindtable;
1800 // SymbolizerGetOpInfo() is the operand information call back function.
1801 // This is called to get the symbolic information for operand(s) of an
1802 // instruction when it is being done. This routine does this from
1803 // the relocation information, symbol table, etc. That block of information
1804 // is a pointer to the struct DisassembleInfo that was passed when the
1805 // disassembler context was created and passed to back to here when
1806 // called back by the disassembler for instruction operands that could have
1807 // relocation information. The address of the instruction containing operand is
1808 // at the Pc parameter. The immediate value the operand has is passed in
1809 // op_info->Value and is at Offset past the start of the instruction and has a
1810 // byte Size of 1, 2 or 4. The symbolc information is returned in TagBuf is the
1811 // LLVMOpInfo1 struct defined in the header "llvm-c/Disassembler.h" as symbol
1812 // names and addends of the symbolic expression to add for the operand. The
1813 // value of TagType is currently 1 (for the LLVMOpInfo1 struct). If symbolic
1814 // information is returned then this function returns 1 else it returns 0.
1815 static int SymbolizerGetOpInfo(void *DisInfo, uint64_t Pc, uint64_t Offset,
1816 uint64_t Size, int TagType, void *TagBuf) {
1817 struct DisassembleInfo *info = (struct DisassembleInfo *)DisInfo;
1818 struct LLVMOpInfo1 *op_info = (struct LLVMOpInfo1 *)TagBuf;
1819 uint64_t value = op_info->Value;
1821 // Make sure all fields returned are zero if we don't set them.
1822 memset((void *)op_info, '\0', sizeof(struct LLVMOpInfo1));
1823 op_info->Value = value;
1825 // If the TagType is not the value 1 which it code knows about or if no
1826 // verbose symbolic information is wanted then just return 0, indicating no
1827 // information is being returned.
1828 if (TagType != 1 || !info->verbose)
1831 unsigned int Arch = info->O->getArch();
1832 if (Arch == Triple::x86) {
1833 if (Size != 1 && Size != 2 && Size != 4 && Size != 0)
1835 if (info->O->getHeader().filetype != MachO::MH_OBJECT) {
1837 // Search the external relocation entries of a fully linked image
1838 // (if any) for an entry that matches this segment offset.
1839 // uint32_t seg_offset = (Pc + Offset);
1842 // In MH_OBJECT filetypes search the section's relocation entries (if any)
1843 // for an entry for this section offset.
1844 uint32_t sect_addr = info->S.getAddress();
1845 uint32_t sect_offset = (Pc + Offset) - sect_addr;
1846 bool reloc_found = false;
1848 MachO::any_relocation_info RE;
1849 bool isExtern = false;
1851 bool r_scattered = false;
1852 uint32_t r_value, pair_r_value, r_type;
1853 for (const RelocationRef &Reloc : info->S.relocations()) {
1854 uint64_t RelocOffset = Reloc.getOffset();
1855 if (RelocOffset == sect_offset) {
1856 Rel = Reloc.getRawDataRefImpl();
1857 RE = info->O->getRelocation(Rel);
1858 r_type = info->O->getAnyRelocationType(RE);
1859 r_scattered = info->O->isRelocationScattered(RE);
1861 r_value = info->O->getScatteredRelocationValue(RE);
1862 if (r_type == MachO::GENERIC_RELOC_SECTDIFF ||
1863 r_type == MachO::GENERIC_RELOC_LOCAL_SECTDIFF) {
1864 DataRefImpl RelNext = Rel;
1865 info->O->moveRelocationNext(RelNext);
1866 MachO::any_relocation_info RENext;
1867 RENext = info->O->getRelocation(RelNext);
1868 if (info->O->isRelocationScattered(RENext))
1869 pair_r_value = info->O->getScatteredRelocationValue(RENext);
1874 isExtern = info->O->getPlainRelocationExternal(RE);
1876 symbol_iterator RelocSym = Reloc.getSymbol();
1884 if (reloc_found && isExtern) {
1885 Expected<StringRef> SymName = Symbol.getName();
1887 report_error(info->O->getFileName(), SymName.takeError());
1888 const char *name = SymName->data();
1889 op_info->AddSymbol.Present = 1;
1890 op_info->AddSymbol.Name = name;
1891 // For i386 extern relocation entries the value in the instruction is
1892 // the offset from the symbol, and value is already set in op_info->Value.
1895 if (reloc_found && (r_type == MachO::GENERIC_RELOC_SECTDIFF ||
1896 r_type == MachO::GENERIC_RELOC_LOCAL_SECTDIFF)) {
1897 const char *add = GuessSymbolName(r_value, info->AddrMap);
1898 const char *sub = GuessSymbolName(pair_r_value, info->AddrMap);
1899 uint32_t offset = value - (r_value - pair_r_value);
1900 op_info->AddSymbol.Present = 1;
1902 op_info->AddSymbol.Name = add;
1904 op_info->AddSymbol.Value = r_value;
1905 op_info->SubtractSymbol.Present = 1;
1907 op_info->SubtractSymbol.Name = sub;
1909 op_info->SubtractSymbol.Value = pair_r_value;
1910 op_info->Value = offset;
1915 if (Arch == Triple::x86_64) {
1916 if (Size != 1 && Size != 2 && Size != 4 && Size != 0)
1918 if (info->O->getHeader().filetype != MachO::MH_OBJECT) {
1920 // Search the external relocation entries of a fully linked image
1921 // (if any) for an entry that matches this segment offset.
1922 // uint64_t seg_offset = (Pc + Offset);
1925 // In MH_OBJECT filetypes search the section's relocation entries (if any)
1926 // for an entry for this section offset.
1927 uint64_t sect_addr = info->S.getAddress();
1928 uint64_t sect_offset = (Pc + Offset) - sect_addr;
1929 bool reloc_found = false;
1931 MachO::any_relocation_info RE;
1932 bool isExtern = false;
1934 for (const RelocationRef &Reloc : info->S.relocations()) {
1935 uint64_t RelocOffset = Reloc.getOffset();
1936 if (RelocOffset == sect_offset) {
1937 Rel = Reloc.getRawDataRefImpl();
1938 RE = info->O->getRelocation(Rel);
1939 // NOTE: Scattered relocations don't exist on x86_64.
1940 isExtern = info->O->getPlainRelocationExternal(RE);
1942 symbol_iterator RelocSym = Reloc.getSymbol();
1949 if (reloc_found && isExtern) {
1950 // The Value passed in will be adjusted by the Pc if the instruction
1951 // adds the Pc. But for x86_64 external relocation entries the Value
1952 // is the offset from the external symbol.
1953 if (info->O->getAnyRelocationPCRel(RE))
1954 op_info->Value -= Pc + Offset + Size;
1955 Expected<StringRef> SymName = Symbol.getName();
1957 report_error(info->O->getFileName(), SymName.takeError());
1958 const char *name = SymName->data();
1959 unsigned Type = info->O->getAnyRelocationType(RE);
1960 if (Type == MachO::X86_64_RELOC_SUBTRACTOR) {
1961 DataRefImpl RelNext = Rel;
1962 info->O->moveRelocationNext(RelNext);
1963 MachO::any_relocation_info RENext = info->O->getRelocation(RelNext);
1964 unsigned TypeNext = info->O->getAnyRelocationType(RENext);
1965 bool isExternNext = info->O->getPlainRelocationExternal(RENext);
1966 unsigned SymbolNum = info->O->getPlainRelocationSymbolNum(RENext);
1967 if (TypeNext == MachO::X86_64_RELOC_UNSIGNED && isExternNext) {
1968 op_info->SubtractSymbol.Present = 1;
1969 op_info->SubtractSymbol.Name = name;
1970 symbol_iterator RelocSymNext = info->O->getSymbolByIndex(SymbolNum);
1971 Symbol = *RelocSymNext;
1972 Expected<StringRef> SymNameNext = Symbol.getName();
1974 report_error(info->O->getFileName(), SymNameNext.takeError());
1975 name = SymNameNext->data();
1978 // TODO: add the VariantKinds to op_info->VariantKind for relocation types
1979 // like: X86_64_RELOC_TLV, X86_64_RELOC_GOT_LOAD and X86_64_RELOC_GOT.
1980 op_info->AddSymbol.Present = 1;
1981 op_info->AddSymbol.Name = name;
1986 if (Arch == Triple::arm) {
1987 if (Offset != 0 || (Size != 4 && Size != 2))
1989 if (info->O->getHeader().filetype != MachO::MH_OBJECT) {
1991 // Search the external relocation entries of a fully linked image
1992 // (if any) for an entry that matches this segment offset.
1993 // uint32_t seg_offset = (Pc + Offset);
1996 // In MH_OBJECT filetypes search the section's relocation entries (if any)
1997 // for an entry for this section offset.
1998 uint32_t sect_addr = info->S.getAddress();
1999 uint32_t sect_offset = (Pc + Offset) - sect_addr;
2001 MachO::any_relocation_info RE;
2002 bool isExtern = false;
2004 bool r_scattered = false;
2005 uint32_t r_value, pair_r_value, r_type, r_length, other_half;
2007 find_if(info->S.relocations(), [&](const RelocationRef &Reloc) {
2008 uint64_t RelocOffset = Reloc.getOffset();
2009 return RelocOffset == sect_offset;
2012 if (Reloc == info->S.relocations().end())
2015 Rel = Reloc->getRawDataRefImpl();
2016 RE = info->O->getRelocation(Rel);
2017 r_length = info->O->getAnyRelocationLength(RE);
2018 r_scattered = info->O->isRelocationScattered(RE);
2020 r_value = info->O->getScatteredRelocationValue(RE);
2021 r_type = info->O->getScatteredRelocationType(RE);
2023 r_type = info->O->getAnyRelocationType(RE);
2024 isExtern = info->O->getPlainRelocationExternal(RE);
2026 symbol_iterator RelocSym = Reloc->getSymbol();
2030 if (r_type == MachO::ARM_RELOC_HALF ||
2031 r_type == MachO::ARM_RELOC_SECTDIFF ||
2032 r_type == MachO::ARM_RELOC_LOCAL_SECTDIFF ||
2033 r_type == MachO::ARM_RELOC_HALF_SECTDIFF) {
2034 DataRefImpl RelNext = Rel;
2035 info->O->moveRelocationNext(RelNext);
2036 MachO::any_relocation_info RENext;
2037 RENext = info->O->getRelocation(RelNext);
2038 other_half = info->O->getAnyRelocationAddress(RENext) & 0xffff;
2039 if (info->O->isRelocationScattered(RENext))
2040 pair_r_value = info->O->getScatteredRelocationValue(RENext);
2044 Expected<StringRef> SymName = Symbol.getName();
2046 report_error(info->O->getFileName(), SymName.takeError());
2047 const char *name = SymName->data();
2048 op_info->AddSymbol.Present = 1;
2049 op_info->AddSymbol.Name = name;
2051 case MachO::ARM_RELOC_HALF:
2052 if ((r_length & 0x1) == 1) {
2053 op_info->Value = value << 16 | other_half;
2054 op_info->VariantKind = LLVMDisassembler_VariantKind_ARM_HI16;
2056 op_info->Value = other_half << 16 | value;
2057 op_info->VariantKind = LLVMDisassembler_VariantKind_ARM_LO16;
2065 // If we have a branch that is not an external relocation entry then
2066 // return 0 so the code in tryAddingSymbolicOperand() can use the
2067 // SymbolLookUp call back with the branch target address to look up the
2068 // symbol and possibility add an annotation for a symbol stub.
2069 if (isExtern == 0 && (r_type == MachO::ARM_RELOC_BR24 ||
2070 r_type == MachO::ARM_THUMB_RELOC_BR22))
2073 uint32_t offset = 0;
2074 if (r_type == MachO::ARM_RELOC_HALF ||
2075 r_type == MachO::ARM_RELOC_HALF_SECTDIFF) {
2076 if ((r_length & 0x1) == 1)
2077 value = value << 16 | other_half;
2079 value = other_half << 16 | value;
2081 if (r_scattered && (r_type != MachO::ARM_RELOC_HALF &&
2082 r_type != MachO::ARM_RELOC_HALF_SECTDIFF)) {
2083 offset = value - r_value;
2087 if (r_type == MachO::ARM_RELOC_HALF_SECTDIFF) {
2088 if ((r_length & 0x1) == 1)
2089 op_info->VariantKind = LLVMDisassembler_VariantKind_ARM_HI16;
2091 op_info->VariantKind = LLVMDisassembler_VariantKind_ARM_LO16;
2092 const char *add = GuessSymbolName(r_value, info->AddrMap);
2093 const char *sub = GuessSymbolName(pair_r_value, info->AddrMap);
2094 int32_t offset = value - (r_value - pair_r_value);
2095 op_info->AddSymbol.Present = 1;
2097 op_info->AddSymbol.Name = add;
2099 op_info->AddSymbol.Value = r_value;
2100 op_info->SubtractSymbol.Present = 1;
2102 op_info->SubtractSymbol.Name = sub;
2104 op_info->SubtractSymbol.Value = pair_r_value;
2105 op_info->Value = offset;
2109 op_info->AddSymbol.Present = 1;
2110 op_info->Value = offset;
2111 if (r_type == MachO::ARM_RELOC_HALF) {
2112 if ((r_length & 0x1) == 1)
2113 op_info->VariantKind = LLVMDisassembler_VariantKind_ARM_HI16;
2115 op_info->VariantKind = LLVMDisassembler_VariantKind_ARM_LO16;
2117 const char *add = GuessSymbolName(value, info->AddrMap);
2118 if (add != nullptr) {
2119 op_info->AddSymbol.Name = add;
2122 op_info->AddSymbol.Value = value;
2125 if (Arch == Triple::aarch64) {
2126 if (Offset != 0 || Size != 4)
2128 if (info->O->getHeader().filetype != MachO::MH_OBJECT) {
2130 // Search the external relocation entries of a fully linked image
2131 // (if any) for an entry that matches this segment offset.
2132 // uint64_t seg_offset = (Pc + Offset);
2135 // In MH_OBJECT filetypes search the section's relocation entries (if any)
2136 // for an entry for this section offset.
2137 uint64_t sect_addr = info->S.getAddress();
2138 uint64_t sect_offset = (Pc + Offset) - sect_addr;
2140 find_if(info->S.relocations(), [&](const RelocationRef &Reloc) {
2141 uint64_t RelocOffset = Reloc.getOffset();
2142 return RelocOffset == sect_offset;
2145 if (Reloc == info->S.relocations().end())
2148 DataRefImpl Rel = Reloc->getRawDataRefImpl();
2149 MachO::any_relocation_info RE = info->O->getRelocation(Rel);
2150 uint32_t r_type = info->O->getAnyRelocationType(RE);
2151 if (r_type == MachO::ARM64_RELOC_ADDEND) {
2152 DataRefImpl RelNext = Rel;
2153 info->O->moveRelocationNext(RelNext);
2154 MachO::any_relocation_info RENext = info->O->getRelocation(RelNext);
2156 value = info->O->getPlainRelocationSymbolNum(RENext);
2157 op_info->Value = value;
2160 // NOTE: Scattered relocations don't exist on arm64.
2161 if (!info->O->getPlainRelocationExternal(RE))
2163 Expected<StringRef> SymName = Reloc->getSymbol()->getName();
2165 report_error(info->O->getFileName(), SymName.takeError());
2166 const char *name = SymName->data();
2167 op_info->AddSymbol.Present = 1;
2168 op_info->AddSymbol.Name = name;
2171 case MachO::ARM64_RELOC_PAGE21:
2173 op_info->VariantKind = LLVMDisassembler_VariantKind_ARM64_PAGE;
2175 case MachO::ARM64_RELOC_PAGEOFF12:
2177 op_info->VariantKind = LLVMDisassembler_VariantKind_ARM64_PAGEOFF;
2179 case MachO::ARM64_RELOC_GOT_LOAD_PAGE21:
2181 op_info->VariantKind = LLVMDisassembler_VariantKind_ARM64_GOTPAGE;
2183 case MachO::ARM64_RELOC_GOT_LOAD_PAGEOFF12:
2185 op_info->VariantKind = LLVMDisassembler_VariantKind_ARM64_GOTPAGEOFF;
2187 case MachO::ARM64_RELOC_TLVP_LOAD_PAGE21:
2188 /* @tvlppage is not implemented in llvm-mc */
2189 op_info->VariantKind = LLVMDisassembler_VariantKind_ARM64_TLVP;
2191 case MachO::ARM64_RELOC_TLVP_LOAD_PAGEOFF12:
2192 /* @tvlppageoff is not implemented in llvm-mc */
2193 op_info->VariantKind = LLVMDisassembler_VariantKind_ARM64_TLVOFF;
2196 case MachO::ARM64_RELOC_BRANCH26:
2197 op_info->VariantKind = LLVMDisassembler_VariantKind_None;
2205 // GuessCstringPointer is passed the address of what might be a pointer to a
2206 // literal string in a cstring section. If that address is in a cstring section
2207 // it returns a pointer to that string. Else it returns nullptr.
2208 static const char *GuessCstringPointer(uint64_t ReferenceValue,
2209 struct DisassembleInfo *info) {
2210 for (const auto &Load : info->O->load_commands()) {
2211 if (Load.C.cmd == MachO::LC_SEGMENT_64) {
2212 MachO::segment_command_64 Seg = info->O->getSegment64LoadCommand(Load);
2213 for (unsigned J = 0; J < Seg.nsects; ++J) {
2214 MachO::section_64 Sec = info->O->getSection64(Load, J);
2215 uint32_t section_type = Sec.flags & MachO::SECTION_TYPE;
2216 if (section_type == MachO::S_CSTRING_LITERALS &&
2217 ReferenceValue >= Sec.addr &&
2218 ReferenceValue < Sec.addr + Sec.size) {
2219 uint64_t sect_offset = ReferenceValue - Sec.addr;
2220 uint64_t object_offset = Sec.offset + sect_offset;
2221 StringRef MachOContents = info->O->getData();
2222 uint64_t object_size = MachOContents.size();
2223 const char *object_addr = (const char *)MachOContents.data();
2224 if (object_offset < object_size) {
2225 const char *name = object_addr + object_offset;
2232 } else if (Load.C.cmd == MachO::LC_SEGMENT) {
2233 MachO::segment_command Seg = info->O->getSegmentLoadCommand(Load);
2234 for (unsigned J = 0; J < Seg.nsects; ++J) {
2235 MachO::section Sec = info->O->getSection(Load, J);
2236 uint32_t section_type = Sec.flags & MachO::SECTION_TYPE;
2237 if (section_type == MachO::S_CSTRING_LITERALS &&
2238 ReferenceValue >= Sec.addr &&
2239 ReferenceValue < Sec.addr + Sec.size) {
2240 uint64_t sect_offset = ReferenceValue - Sec.addr;
2241 uint64_t object_offset = Sec.offset + sect_offset;
2242 StringRef MachOContents = info->O->getData();
2243 uint64_t object_size = MachOContents.size();
2244 const char *object_addr = (const char *)MachOContents.data();
2245 if (object_offset < object_size) {
2246 const char *name = object_addr + object_offset;
2258 // GuessIndirectSymbol returns the name of the indirect symbol for the
2259 // ReferenceValue passed in or nullptr. This is used when ReferenceValue maybe
2260 // an address of a symbol stub or a lazy or non-lazy pointer to associate the
2261 // symbol name being referenced by the stub or pointer.
2262 static const char *GuessIndirectSymbol(uint64_t ReferenceValue,
2263 struct DisassembleInfo *info) {
2264 MachO::dysymtab_command Dysymtab = info->O->getDysymtabLoadCommand();
2265 MachO::symtab_command Symtab = info->O->getSymtabLoadCommand();
2266 for (const auto &Load : info->O->load_commands()) {
2267 if (Load.C.cmd == MachO::LC_SEGMENT_64) {
2268 MachO::segment_command_64 Seg = info->O->getSegment64LoadCommand(Load);
2269 for (unsigned J = 0; J < Seg.nsects; ++J) {
2270 MachO::section_64 Sec = info->O->getSection64(Load, J);
2271 uint32_t section_type = Sec.flags & MachO::SECTION_TYPE;
2272 if ((section_type == MachO::S_NON_LAZY_SYMBOL_POINTERS ||
2273 section_type == MachO::S_LAZY_SYMBOL_POINTERS ||
2274 section_type == MachO::S_LAZY_DYLIB_SYMBOL_POINTERS ||
2275 section_type == MachO::S_THREAD_LOCAL_VARIABLE_POINTERS ||
2276 section_type == MachO::S_SYMBOL_STUBS) &&
2277 ReferenceValue >= Sec.addr &&
2278 ReferenceValue < Sec.addr + Sec.size) {
2280 if (section_type == MachO::S_SYMBOL_STUBS)
2281 stride = Sec.reserved2;
2286 uint32_t index = Sec.reserved1 + (ReferenceValue - Sec.addr) / stride;
2287 if (index < Dysymtab.nindirectsyms) {
2288 uint32_t indirect_symbol =
2289 info->O->getIndirectSymbolTableEntry(Dysymtab, index);
2290 if (indirect_symbol < Symtab.nsyms) {
2291 symbol_iterator Sym = info->O->getSymbolByIndex(indirect_symbol);
2292 SymbolRef Symbol = *Sym;
2293 Expected<StringRef> SymName = Symbol.getName();
2295 report_error(info->O->getFileName(), SymName.takeError());
2296 const char *name = SymName->data();
2302 } else if (Load.C.cmd == MachO::LC_SEGMENT) {
2303 MachO::segment_command Seg = info->O->getSegmentLoadCommand(Load);
2304 for (unsigned J = 0; J < Seg.nsects; ++J) {
2305 MachO::section Sec = info->O->getSection(Load, J);
2306 uint32_t section_type = Sec.flags & MachO::SECTION_TYPE;
2307 if ((section_type == MachO::S_NON_LAZY_SYMBOL_POINTERS ||
2308 section_type == MachO::S_LAZY_SYMBOL_POINTERS ||
2309 section_type == MachO::S_LAZY_DYLIB_SYMBOL_POINTERS ||
2310 section_type == MachO::S_THREAD_LOCAL_VARIABLE_POINTERS ||
2311 section_type == MachO::S_SYMBOL_STUBS) &&
2312 ReferenceValue >= Sec.addr &&
2313 ReferenceValue < Sec.addr + Sec.size) {
2315 if (section_type == MachO::S_SYMBOL_STUBS)
2316 stride = Sec.reserved2;
2321 uint32_t index = Sec.reserved1 + (ReferenceValue - Sec.addr) / stride;
2322 if (index < Dysymtab.nindirectsyms) {
2323 uint32_t indirect_symbol =
2324 info->O->getIndirectSymbolTableEntry(Dysymtab, index);
2325 if (indirect_symbol < Symtab.nsyms) {
2326 symbol_iterator Sym = info->O->getSymbolByIndex(indirect_symbol);
2327 SymbolRef Symbol = *Sym;
2328 Expected<StringRef> SymName = Symbol.getName();
2330 report_error(info->O->getFileName(), SymName.takeError());
2331 const char *name = SymName->data();
2342 // method_reference() is called passing it the ReferenceName that might be
2343 // a reference it to an Objective-C method call. If so then it allocates and
2344 // assembles a method call string with the values last seen and saved in
2345 // the DisassembleInfo's class_name and selector_name fields. This is saved
2346 // into the method field of the info and any previous string is free'ed.
2347 // Then the class_name field in the info is set to nullptr. The method call
2348 // string is set into ReferenceName and ReferenceType is set to
2349 // LLVMDisassembler_ReferenceType_Out_Objc_Message. If this not a method call
2350 // then both ReferenceType and ReferenceName are left unchanged.
2351 static void method_reference(struct DisassembleInfo *info,
2352 uint64_t *ReferenceType,
2353 const char **ReferenceName) {
2354 unsigned int Arch = info->O->getArch();
2355 if (*ReferenceName != nullptr) {
2356 if (strcmp(*ReferenceName, "_objc_msgSend") == 0) {
2357 if (info->selector_name != nullptr) {
2358 if (info->method != nullptr)
2360 if (info->class_name != nullptr) {
2361 info->method = (char *)malloc(5 + strlen(info->class_name) +
2362 strlen(info->selector_name));
2363 if (info->method != nullptr) {
2364 strcpy(info->method, "+[");
2365 strcat(info->method, info->class_name);
2366 strcat(info->method, " ");
2367 strcat(info->method, info->selector_name);
2368 strcat(info->method, "]");
2369 *ReferenceName = info->method;
2370 *ReferenceType = LLVMDisassembler_ReferenceType_Out_Objc_Message;
2373 info->method = (char *)malloc(9 + strlen(info->selector_name));
2374 if (info->method != nullptr) {
2375 if (Arch == Triple::x86_64)
2376 strcpy(info->method, "-[%rdi ");
2377 else if (Arch == Triple::aarch64)
2378 strcpy(info->method, "-[x0 ");
2380 strcpy(info->method, "-[r? ");
2381 strcat(info->method, info->selector_name);
2382 strcat(info->method, "]");
2383 *ReferenceName = info->method;
2384 *ReferenceType = LLVMDisassembler_ReferenceType_Out_Objc_Message;
2387 info->class_name = nullptr;
2389 } else if (strcmp(*ReferenceName, "_objc_msgSendSuper2") == 0) {
2390 if (info->selector_name != nullptr) {
2391 if (info->method != nullptr)
2393 info->method = (char *)malloc(17 + strlen(info->selector_name));
2394 if (info->method != nullptr) {
2395 if (Arch == Triple::x86_64)
2396 strcpy(info->method, "-[[%rdi super] ");
2397 else if (Arch == Triple::aarch64)
2398 strcpy(info->method, "-[[x0 super] ");
2400 strcpy(info->method, "-[[r? super] ");
2401 strcat(info->method, info->selector_name);
2402 strcat(info->method, "]");
2403 *ReferenceName = info->method;
2404 *ReferenceType = LLVMDisassembler_ReferenceType_Out_Objc_Message;
2406 info->class_name = nullptr;
2412 // GuessPointerPointer() is passed the address of what might be a pointer to
2413 // a reference to an Objective-C class, selector, message ref or cfstring.
2414 // If so the value of the pointer is returned and one of the booleans are set
2415 // to true. If not zero is returned and all the booleans are set to false.
2416 static uint64_t GuessPointerPointer(uint64_t ReferenceValue,
2417 struct DisassembleInfo *info,
2418 bool &classref, bool &selref, bool &msgref,
2424 for (const auto &Load : info->O->load_commands()) {
2425 if (Load.C.cmd == MachO::LC_SEGMENT_64) {
2426 MachO::segment_command_64 Seg = info->O->getSegment64LoadCommand(Load);
2427 for (unsigned J = 0; J < Seg.nsects; ++J) {
2428 MachO::section_64 Sec = info->O->getSection64(Load, J);
2429 if ((strncmp(Sec.sectname, "__objc_selrefs", 16) == 0 ||
2430 strncmp(Sec.sectname, "__objc_classrefs", 16) == 0 ||
2431 strncmp(Sec.sectname, "__objc_superrefs", 16) == 0 ||
2432 strncmp(Sec.sectname, "__objc_msgrefs", 16) == 0 ||
2433 strncmp(Sec.sectname, "__cfstring", 16) == 0) &&
2434 ReferenceValue >= Sec.addr &&
2435 ReferenceValue < Sec.addr + Sec.size) {
2436 uint64_t sect_offset = ReferenceValue - Sec.addr;
2437 uint64_t object_offset = Sec.offset + sect_offset;
2438 StringRef MachOContents = info->O->getData();
2439 uint64_t object_size = MachOContents.size();
2440 const char *object_addr = (const char *)MachOContents.data();
2441 if (object_offset < object_size) {
2442 uint64_t pointer_value;
2443 memcpy(&pointer_value, object_addr + object_offset,
2445 if (info->O->isLittleEndian() != sys::IsLittleEndianHost)
2446 sys::swapByteOrder(pointer_value);
2447 if (strncmp(Sec.sectname, "__objc_selrefs", 16) == 0)
2449 else if (strncmp(Sec.sectname, "__objc_classrefs", 16) == 0 ||
2450 strncmp(Sec.sectname, "__objc_superrefs", 16) == 0)
2452 else if (strncmp(Sec.sectname, "__objc_msgrefs", 16) == 0 &&
2453 ReferenceValue + 8 < Sec.addr + Sec.size) {
2455 memcpy(&pointer_value, object_addr + object_offset + 8,
2457 if (info->O->isLittleEndian() != sys::IsLittleEndianHost)
2458 sys::swapByteOrder(pointer_value);
2459 } else if (strncmp(Sec.sectname, "__cfstring", 16) == 0)
2461 return pointer_value;
2468 // TODO: Look for LC_SEGMENT for 32-bit Mach-O files.
2473 // get_pointer_64 returns a pointer to the bytes in the object file at the
2474 // Address from a section in the Mach-O file. And indirectly returns the
2475 // offset into the section, number of bytes left in the section past the offset
2476 // and which section is was being referenced. If the Address is not in a
2477 // section nullptr is returned.
2478 static const char *get_pointer_64(uint64_t Address, uint32_t &offset,
2479 uint32_t &left, SectionRef &S,
2480 DisassembleInfo *info,
2481 bool objc_only = false) {
2485 for (unsigned SectIdx = 0; SectIdx != info->Sections->size(); SectIdx++) {
2486 uint64_t SectAddress = ((*(info->Sections))[SectIdx]).getAddress();
2487 uint64_t SectSize = ((*(info->Sections))[SectIdx]).getSize();
2492 ((*(info->Sections))[SectIdx]).getName(SectName);
2493 DataRefImpl Ref = ((*(info->Sections))[SectIdx]).getRawDataRefImpl();
2494 StringRef SegName = info->O->getSectionFinalSegmentName(Ref);
2495 if (SegName != "__OBJC" && SectName != "__cstring")
2498 if (Address >= SectAddress && Address < SectAddress + SectSize) {
2499 S = (*(info->Sections))[SectIdx];
2500 offset = Address - SectAddress;
2501 left = SectSize - offset;
2502 StringRef SectContents;
2503 ((*(info->Sections))[SectIdx]).getContents(SectContents);
2504 return SectContents.data() + offset;
2510 static const char *get_pointer_32(uint32_t Address, uint32_t &offset,
2511 uint32_t &left, SectionRef &S,
2512 DisassembleInfo *info,
2513 bool objc_only = false) {
2514 return get_pointer_64(Address, offset, left, S, info, objc_only);
2517 // get_symbol_64() returns the name of a symbol (or nullptr) and the address of
2518 // the symbol indirectly through n_value. Based on the relocation information
2519 // for the specified section offset in the specified section reference.
2520 // If no relocation information is found and a non-zero ReferenceValue for the
2521 // symbol is passed, look up that address in the info's AddrMap.
2522 static const char *get_symbol_64(uint32_t sect_offset, SectionRef S,
2523 DisassembleInfo *info, uint64_t &n_value,
2524 uint64_t ReferenceValue = 0) {
2529 // See if there is an external relocation entry at the sect_offset.
2530 bool reloc_found = false;
2532 MachO::any_relocation_info RE;
2533 bool isExtern = false;
2535 for (const RelocationRef &Reloc : S.relocations()) {
2536 uint64_t RelocOffset = Reloc.getOffset();
2537 if (RelocOffset == sect_offset) {
2538 Rel = Reloc.getRawDataRefImpl();
2539 RE = info->O->getRelocation(Rel);
2540 if (info->O->isRelocationScattered(RE))
2542 isExtern = info->O->getPlainRelocationExternal(RE);
2544 symbol_iterator RelocSym = Reloc.getSymbol();
2551 // If there is an external relocation entry for a symbol in this section
2552 // at this section_offset then use that symbol's value for the n_value
2553 // and return its name.
2554 const char *SymbolName = nullptr;
2555 if (reloc_found && isExtern) {
2556 n_value = Symbol.getValue();
2557 Expected<StringRef> NameOrError = Symbol.getName();
2559 report_error(info->O->getFileName(), NameOrError.takeError());
2560 StringRef Name = *NameOrError;
2561 if (!Name.empty()) {
2562 SymbolName = Name.data();
2567 // TODO: For fully linked images, look through the external relocation
2568 // entries off the dynamic symtab command. For these the r_offset is from the
2569 // start of the first writeable segment in the Mach-O file. So the offset
2570 // to this section from that segment is passed to this routine by the caller,
2571 // as the database_offset. Which is the difference of the section's starting
2572 // address and the first writable segment.
2574 // NOTE: need add passing the database_offset to this routine.
2576 // We did not find an external relocation entry so look up the ReferenceValue
2577 // as an address of a symbol and if found return that symbol's name.
2578 SymbolName = GuessSymbolName(ReferenceValue, info->AddrMap);
2583 static const char *get_symbol_32(uint32_t sect_offset, SectionRef S,
2584 DisassembleInfo *info,
2585 uint32_t ReferenceValue) {
2587 return get_symbol_64(sect_offset, S, info, n_value64, ReferenceValue);
2590 // These are structs in the Objective-C meta data and read to produce the
2591 // comments for disassembly. While these are part of the ABI they are no
2592 // public defintions. So the are here not in include/llvm/Support/MachO.h .
2594 // The cfstring object in a 64-bit Mach-O file.
2595 struct cfstring64_t {
2596 uint64_t isa; // class64_t * (64-bit pointer)
2597 uint64_t flags; // flag bits
2598 uint64_t characters; // char * (64-bit pointer)
2599 uint64_t length; // number of non-NULL characters in above
2602 // The class object in a 64-bit Mach-O file.
2604 uint64_t isa; // class64_t * (64-bit pointer)
2605 uint64_t superclass; // class64_t * (64-bit pointer)
2606 uint64_t cache; // Cache (64-bit pointer)
2607 uint64_t vtable; // IMP * (64-bit pointer)
2608 uint64_t data; // class_ro64_t * (64-bit pointer)
2612 uint32_t isa; /* class32_t * (32-bit pointer) */
2613 uint32_t superclass; /* class32_t * (32-bit pointer) */
2614 uint32_t cache; /* Cache (32-bit pointer) */
2615 uint32_t vtable; /* IMP * (32-bit pointer) */
2616 uint32_t data; /* class_ro32_t * (32-bit pointer) */
2619 struct class_ro64_t {
2621 uint32_t instanceStart;
2622 uint32_t instanceSize;
2624 uint64_t ivarLayout; // const uint8_t * (64-bit pointer)
2625 uint64_t name; // const char * (64-bit pointer)
2626 uint64_t baseMethods; // const method_list_t * (64-bit pointer)
2627 uint64_t baseProtocols; // const protocol_list_t * (64-bit pointer)
2628 uint64_t ivars; // const ivar_list_t * (64-bit pointer)
2629 uint64_t weakIvarLayout; // const uint8_t * (64-bit pointer)
2630 uint64_t baseProperties; // const struct objc_property_list (64-bit pointer)
2633 struct class_ro32_t {
2635 uint32_t instanceStart;
2636 uint32_t instanceSize;
2637 uint32_t ivarLayout; /* const uint8_t * (32-bit pointer) */
2638 uint32_t name; /* const char * (32-bit pointer) */
2639 uint32_t baseMethods; /* const method_list_t * (32-bit pointer) */
2640 uint32_t baseProtocols; /* const protocol_list_t * (32-bit pointer) */
2641 uint32_t ivars; /* const ivar_list_t * (32-bit pointer) */
2642 uint32_t weakIvarLayout; /* const uint8_t * (32-bit pointer) */
2643 uint32_t baseProperties; /* const struct objc_property_list *
2647 /* Values for class_ro{64,32}_t->flags */
2648 #define RO_META (1 << 0)
2649 #define RO_ROOT (1 << 1)
2650 #define RO_HAS_CXX_STRUCTORS (1 << 2)
2652 struct method_list64_t {
2655 /* struct method64_t first; These structures follow inline */
2658 struct method_list32_t {
2661 /* struct method32_t first; These structures follow inline */
2665 uint64_t name; /* SEL (64-bit pointer) */
2666 uint64_t types; /* const char * (64-bit pointer) */
2667 uint64_t imp; /* IMP (64-bit pointer) */
2671 uint32_t name; /* SEL (32-bit pointer) */
2672 uint32_t types; /* const char * (32-bit pointer) */
2673 uint32_t imp; /* IMP (32-bit pointer) */
2676 struct protocol_list64_t {
2677 uint64_t count; /* uintptr_t (a 64-bit value) */
2678 /* struct protocol64_t * list[0]; These pointers follow inline */
2681 struct protocol_list32_t {
2682 uint32_t count; /* uintptr_t (a 32-bit value) */
2683 /* struct protocol32_t * list[0]; These pointers follow inline */
2686 struct protocol64_t {
2687 uint64_t isa; /* id * (64-bit pointer) */
2688 uint64_t name; /* const char * (64-bit pointer) */
2689 uint64_t protocols; /* struct protocol_list64_t *
2691 uint64_t instanceMethods; /* method_list_t * (64-bit pointer) */
2692 uint64_t classMethods; /* method_list_t * (64-bit pointer) */
2693 uint64_t optionalInstanceMethods; /* method_list_t * (64-bit pointer) */
2694 uint64_t optionalClassMethods; /* method_list_t * (64-bit pointer) */
2695 uint64_t instanceProperties; /* struct objc_property_list *
2699 struct protocol32_t {
2700 uint32_t isa; /* id * (32-bit pointer) */
2701 uint32_t name; /* const char * (32-bit pointer) */
2702 uint32_t protocols; /* struct protocol_list_t *
2704 uint32_t instanceMethods; /* method_list_t * (32-bit pointer) */
2705 uint32_t classMethods; /* method_list_t * (32-bit pointer) */
2706 uint32_t optionalInstanceMethods; /* method_list_t * (32-bit pointer) */
2707 uint32_t optionalClassMethods; /* method_list_t * (32-bit pointer) */
2708 uint32_t instanceProperties; /* struct objc_property_list *
2712 struct ivar_list64_t {
2715 /* struct ivar64_t first; These structures follow inline */
2718 struct ivar_list32_t {
2721 /* struct ivar32_t first; These structures follow inline */
2725 uint64_t offset; /* uintptr_t * (64-bit pointer) */
2726 uint64_t name; /* const char * (64-bit pointer) */
2727 uint64_t type; /* const char * (64-bit pointer) */
2733 uint32_t offset; /* uintptr_t * (32-bit pointer) */
2734 uint32_t name; /* const char * (32-bit pointer) */
2735 uint32_t type; /* const char * (32-bit pointer) */
2740 struct objc_property_list64 {
2743 /* struct objc_property64 first; These structures follow inline */
2746 struct objc_property_list32 {
2749 /* struct objc_property32 first; These structures follow inline */
2752 struct objc_property64 {
2753 uint64_t name; /* const char * (64-bit pointer) */
2754 uint64_t attributes; /* const char * (64-bit pointer) */
2757 struct objc_property32 {
2758 uint32_t name; /* const char * (32-bit pointer) */
2759 uint32_t attributes; /* const char * (32-bit pointer) */
2762 struct category64_t {
2763 uint64_t name; /* const char * (64-bit pointer) */
2764 uint64_t cls; /* struct class_t * (64-bit pointer) */
2765 uint64_t instanceMethods; /* struct method_list_t * (64-bit pointer) */
2766 uint64_t classMethods; /* struct method_list_t * (64-bit pointer) */
2767 uint64_t protocols; /* struct protocol_list_t * (64-bit pointer) */
2768 uint64_t instanceProperties; /* struct objc_property_list *
2772 struct category32_t {
2773 uint32_t name; /* const char * (32-bit pointer) */
2774 uint32_t cls; /* struct class_t * (32-bit pointer) */
2775 uint32_t instanceMethods; /* struct method_list_t * (32-bit pointer) */
2776 uint32_t classMethods; /* struct method_list_t * (32-bit pointer) */
2777 uint32_t protocols; /* struct protocol_list_t * (32-bit pointer) */
2778 uint32_t instanceProperties; /* struct objc_property_list *
2782 struct objc_image_info64 {
2786 struct objc_image_info32 {
2790 struct imageInfo_t {
2794 /* masks for objc_image_info.flags */
2795 #define OBJC_IMAGE_IS_REPLACEMENT (1 << 0)
2796 #define OBJC_IMAGE_SUPPORTS_GC (1 << 1)
2798 struct message_ref64 {
2799 uint64_t imp; /* IMP (64-bit pointer) */
2800 uint64_t sel; /* SEL (64-bit pointer) */
2803 struct message_ref32 {
2804 uint32_t imp; /* IMP (32-bit pointer) */
2805 uint32_t sel; /* SEL (32-bit pointer) */
2808 // Objective-C 1 (32-bit only) meta data structs.
2810 struct objc_module_t {
2813 uint32_t name; /* char * (32-bit pointer) */
2814 uint32_t symtab; /* struct objc_symtab * (32-bit pointer) */
2817 struct objc_symtab_t {
2818 uint32_t sel_ref_cnt;
2819 uint32_t refs; /* SEL * (32-bit pointer) */
2820 uint16_t cls_def_cnt;
2821 uint16_t cat_def_cnt;
2822 // uint32_t defs[1]; /* void * (32-bit pointer) variable size */
2825 struct objc_class_t {
2826 uint32_t isa; /* struct objc_class * (32-bit pointer) */
2827 uint32_t super_class; /* struct objc_class * (32-bit pointer) */
2828 uint32_t name; /* const char * (32-bit pointer) */
2831 int32_t instance_size;
2832 uint32_t ivars; /* struct objc_ivar_list * (32-bit pointer) */
2833 uint32_t methodLists; /* struct objc_method_list ** (32-bit pointer) */
2834 uint32_t cache; /* struct objc_cache * (32-bit pointer) */
2835 uint32_t protocols; /* struct objc_protocol_list * (32-bit pointer) */
2838 #define CLS_GETINFO(cls, infomask) ((cls)->info & (infomask))
2839 // class is not a metaclass
2840 #define CLS_CLASS 0x1
2841 // class is a metaclass
2842 #define CLS_META 0x2
2844 struct objc_category_t {
2845 uint32_t category_name; /* char * (32-bit pointer) */
2846 uint32_t class_name; /* char * (32-bit pointer) */
2847 uint32_t instance_methods; /* struct objc_method_list * (32-bit pointer) */
2848 uint32_t class_methods; /* struct objc_method_list * (32-bit pointer) */
2849 uint32_t protocols; /* struct objc_protocol_list * (32-bit ptr) */
2852 struct objc_ivar_t {
2853 uint32_t ivar_name; /* char * (32-bit pointer) */
2854 uint32_t ivar_type; /* char * (32-bit pointer) */
2855 int32_t ivar_offset;
2858 struct objc_ivar_list_t {
2860 // struct objc_ivar_t ivar_list[1]; /* variable length structure */
2863 struct objc_method_list_t {
2864 uint32_t obsolete; /* struct objc_method_list * (32-bit pointer) */
2865 int32_t method_count;
2866 // struct objc_method_t method_list[1]; /* variable length structure */
2869 struct objc_method_t {
2870 uint32_t method_name; /* SEL, aka struct objc_selector * (32-bit pointer) */
2871 uint32_t method_types; /* char * (32-bit pointer) */
2872 uint32_t method_imp; /* IMP, aka function pointer, (*IMP)(id, SEL, ...)
2876 struct objc_protocol_list_t {
2877 uint32_t next; /* struct objc_protocol_list * (32-bit pointer) */
2879 // uint32_t list[1]; /* Protocol *, aka struct objc_protocol_t *
2880 // (32-bit pointer) */
2883 struct objc_protocol_t {
2884 uint32_t isa; /* struct objc_class * (32-bit pointer) */
2885 uint32_t protocol_name; /* char * (32-bit pointer) */
2886 uint32_t protocol_list; /* struct objc_protocol_list * (32-bit pointer) */
2887 uint32_t instance_methods; /* struct objc_method_description_list *
2889 uint32_t class_methods; /* struct objc_method_description_list *
2893 struct objc_method_description_list_t {
2895 // struct objc_method_description_t list[1];
2898 struct objc_method_description_t {
2899 uint32_t name; /* SEL, aka struct objc_selector * (32-bit pointer) */
2900 uint32_t types; /* char * (32-bit pointer) */
2903 inline void swapStruct(struct cfstring64_t &cfs) {
2904 sys::swapByteOrder(cfs.isa);
2905 sys::swapByteOrder(cfs.flags);
2906 sys::swapByteOrder(cfs.characters);
2907 sys::swapByteOrder(cfs.length);
2910 inline void swapStruct(struct class64_t &c) {
2911 sys::swapByteOrder(c.isa);
2912 sys::swapByteOrder(c.superclass);
2913 sys::swapByteOrder(c.cache);
2914 sys::swapByteOrder(c.vtable);
2915 sys::swapByteOrder(c.data);
2918 inline void swapStruct(struct class32_t &c) {
2919 sys::swapByteOrder(c.isa);
2920 sys::swapByteOrder(c.superclass);
2921 sys::swapByteOrder(c.cache);
2922 sys::swapByteOrder(c.vtable);
2923 sys::swapByteOrder(c.data);
2926 inline void swapStruct(struct class_ro64_t &cro) {
2927 sys::swapByteOrder(cro.flags);
2928 sys::swapByteOrder(cro.instanceStart);
2929 sys::swapByteOrder(cro.instanceSize);
2930 sys::swapByteOrder(cro.reserved);
2931 sys::swapByteOrder(cro.ivarLayout);
2932 sys::swapByteOrder(cro.name);
2933 sys::swapByteOrder(cro.baseMethods);
2934 sys::swapByteOrder(cro.baseProtocols);
2935 sys::swapByteOrder(cro.ivars);
2936 sys::swapByteOrder(cro.weakIvarLayout);
2937 sys::swapByteOrder(cro.baseProperties);
2940 inline void swapStruct(struct class_ro32_t &cro) {
2941 sys::swapByteOrder(cro.flags);
2942 sys::swapByteOrder(cro.instanceStart);
2943 sys::swapByteOrder(cro.instanceSize);
2944 sys::swapByteOrder(cro.ivarLayout);
2945 sys::swapByteOrder(cro.name);
2946 sys::swapByteOrder(cro.baseMethods);
2947 sys::swapByteOrder(cro.baseProtocols);
2948 sys::swapByteOrder(cro.ivars);
2949 sys::swapByteOrder(cro.weakIvarLayout);
2950 sys::swapByteOrder(cro.baseProperties);
2953 inline void swapStruct(struct method_list64_t &ml) {
2954 sys::swapByteOrder(ml.entsize);
2955 sys::swapByteOrder(ml.count);
2958 inline void swapStruct(struct method_list32_t &ml) {
2959 sys::swapByteOrder(ml.entsize);
2960 sys::swapByteOrder(ml.count);
2963 inline void swapStruct(struct method64_t &m) {
2964 sys::swapByteOrder(m.name);
2965 sys::swapByteOrder(m.types);
2966 sys::swapByteOrder(m.imp);
2969 inline void swapStruct(struct method32_t &m) {
2970 sys::swapByteOrder(m.name);
2971 sys::swapByteOrder(m.types);
2972 sys::swapByteOrder(m.imp);
2975 inline void swapStruct(struct protocol_list64_t &pl) {
2976 sys::swapByteOrder(pl.count);
2979 inline void swapStruct(struct protocol_list32_t &pl) {
2980 sys::swapByteOrder(pl.count);
2983 inline void swapStruct(struct protocol64_t &p) {
2984 sys::swapByteOrder(p.isa);
2985 sys::swapByteOrder(p.name);
2986 sys::swapByteOrder(p.protocols);
2987 sys::swapByteOrder(p.instanceMethods);
2988 sys::swapByteOrder(p.classMethods);
2989 sys::swapByteOrder(p.optionalInstanceMethods);
2990 sys::swapByteOrder(p.optionalClassMethods);
2991 sys::swapByteOrder(p.instanceProperties);
2994 inline void swapStruct(struct protocol32_t &p) {
2995 sys::swapByteOrder(p.isa);
2996 sys::swapByteOrder(p.name);
2997 sys::swapByteOrder(p.protocols);
2998 sys::swapByteOrder(p.instanceMethods);
2999 sys::swapByteOrder(p.classMethods);
3000 sys::swapByteOrder(p.optionalInstanceMethods);
3001 sys::swapByteOrder(p.optionalClassMethods);
3002 sys::swapByteOrder(p.instanceProperties);
3005 inline void swapStruct(struct ivar_list64_t &il) {
3006 sys::swapByteOrder(il.entsize);
3007 sys::swapByteOrder(il.count);
3010 inline void swapStruct(struct ivar_list32_t &il) {
3011 sys::swapByteOrder(il.entsize);
3012 sys::swapByteOrder(il.count);
3015 inline void swapStruct(struct ivar64_t &i) {
3016 sys::swapByteOrder(i.offset);
3017 sys::swapByteOrder(i.name);
3018 sys::swapByteOrder(i.type);
3019 sys::swapByteOrder(i.alignment);
3020 sys::swapByteOrder(i.size);
3023 inline void swapStruct(struct ivar32_t &i) {
3024 sys::swapByteOrder(i.offset);
3025 sys::swapByteOrder(i.name);
3026 sys::swapByteOrder(i.type);
3027 sys::swapByteOrder(i.alignment);
3028 sys::swapByteOrder(i.size);
3031 inline void swapStruct(struct objc_property_list64 &pl) {
3032 sys::swapByteOrder(pl.entsize);
3033 sys::swapByteOrder(pl.count);
3036 inline void swapStruct(struct objc_property_list32 &pl) {
3037 sys::swapByteOrder(pl.entsize);
3038 sys::swapByteOrder(pl.count);
3041 inline void swapStruct(struct objc_property64 &op) {
3042 sys::swapByteOrder(op.name);
3043 sys::swapByteOrder(op.attributes);
3046 inline void swapStruct(struct objc_property32 &op) {
3047 sys::swapByteOrder(op.name);
3048 sys::swapByteOrder(op.attributes);
3051 inline void swapStruct(struct category64_t &c) {
3052 sys::swapByteOrder(c.name);
3053 sys::swapByteOrder(c.cls);
3054 sys::swapByteOrder(c.instanceMethods);
3055 sys::swapByteOrder(c.classMethods);
3056 sys::swapByteOrder(c.protocols);
3057 sys::swapByteOrder(c.instanceProperties);
3060 inline void swapStruct(struct category32_t &c) {
3061 sys::swapByteOrder(c.name);
3062 sys::swapByteOrder(c.cls);
3063 sys::swapByteOrder(c.instanceMethods);
3064 sys::swapByteOrder(c.classMethods);
3065 sys::swapByteOrder(c.protocols);
3066 sys::swapByteOrder(c.instanceProperties);
3069 inline void swapStruct(struct objc_image_info64 &o) {
3070 sys::swapByteOrder(o.version);
3071 sys::swapByteOrder(o.flags);
3074 inline void swapStruct(struct objc_image_info32 &o) {
3075 sys::swapByteOrder(o.version);
3076 sys::swapByteOrder(o.flags);
3079 inline void swapStruct(struct imageInfo_t &o) {
3080 sys::swapByteOrder(o.version);
3081 sys::swapByteOrder(o.flags);
3084 inline void swapStruct(struct message_ref64 &mr) {
3085 sys::swapByteOrder(mr.imp);
3086 sys::swapByteOrder(mr.sel);
3089 inline void swapStruct(struct message_ref32 &mr) {
3090 sys::swapByteOrder(mr.imp);
3091 sys::swapByteOrder(mr.sel);
3094 inline void swapStruct(struct objc_module_t &module) {
3095 sys::swapByteOrder(module.version);
3096 sys::swapByteOrder(module.size);
3097 sys::swapByteOrder(module.name);
3098 sys::swapByteOrder(module.symtab);
3101 inline void swapStruct(struct objc_symtab_t &symtab) {
3102 sys::swapByteOrder(symtab.sel_ref_cnt);
3103 sys::swapByteOrder(symtab.refs);
3104 sys::swapByteOrder(symtab.cls_def_cnt);
3105 sys::swapByteOrder(symtab.cat_def_cnt);
3108 inline void swapStruct(struct objc_class_t &objc_class) {
3109 sys::swapByteOrder(objc_class.isa);
3110 sys::swapByteOrder(objc_class.super_class);
3111 sys::swapByteOrder(objc_class.name);
3112 sys::swapByteOrder(objc_class.version);
3113 sys::swapByteOrder(objc_class.info);
3114 sys::swapByteOrder(objc_class.instance_size);
3115 sys::swapByteOrder(objc_class.ivars);
3116 sys::swapByteOrder(objc_class.methodLists);
3117 sys::swapByteOrder(objc_class.cache);
3118 sys::swapByteOrder(objc_class.protocols);
3121 inline void swapStruct(struct objc_category_t &objc_category) {
3122 sys::swapByteOrder(objc_category.category_name);
3123 sys::swapByteOrder(objc_category.class_name);
3124 sys::swapByteOrder(objc_category.instance_methods);
3125 sys::swapByteOrder(objc_category.class_methods);
3126 sys::swapByteOrder(objc_category.protocols);
3129 inline void swapStruct(struct objc_ivar_list_t &objc_ivar_list) {
3130 sys::swapByteOrder(objc_ivar_list.ivar_count);
3133 inline void swapStruct(struct objc_ivar_t &objc_ivar) {
3134 sys::swapByteOrder(objc_ivar.ivar_name);
3135 sys::swapByteOrder(objc_ivar.ivar_type);
3136 sys::swapByteOrder(objc_ivar.ivar_offset);
3139 inline void swapStruct(struct objc_method_list_t &method_list) {
3140 sys::swapByteOrder(method_list.obsolete);
3141 sys::swapByteOrder(method_list.method_count);
3144 inline void swapStruct(struct objc_method_t &method) {
3145 sys::swapByteOrder(method.method_name);
3146 sys::swapByteOrder(method.method_types);
3147 sys::swapByteOrder(method.method_imp);
3150 inline void swapStruct(struct objc_protocol_list_t &protocol_list) {
3151 sys::swapByteOrder(protocol_list.next);
3152 sys::swapByteOrder(protocol_list.count);
3155 inline void swapStruct(struct objc_protocol_t &protocol) {
3156 sys::swapByteOrder(protocol.isa);
3157 sys::swapByteOrder(protocol.protocol_name);
3158 sys::swapByteOrder(protocol.protocol_list);
3159 sys::swapByteOrder(protocol.instance_methods);
3160 sys::swapByteOrder(protocol.class_methods);
3163 inline void swapStruct(struct objc_method_description_list_t &mdl) {
3164 sys::swapByteOrder(mdl.count);
3167 inline void swapStruct(struct objc_method_description_t &md) {
3168 sys::swapByteOrder(md.name);
3169 sys::swapByteOrder(md.types);
3172 static const char *get_dyld_bind_info_symbolname(uint64_t ReferenceValue,
3173 struct DisassembleInfo *info);
3175 // get_objc2_64bit_class_name() is used for disassembly and is passed a pointer
3176 // to an Objective-C class and returns the class name. It is also passed the
3177 // address of the pointer, so when the pointer is zero as it can be in an .o
3178 // file, that is used to look for an external relocation entry with a symbol
3180 static const char *get_objc2_64bit_class_name(uint64_t pointer_value,
3181 uint64_t ReferenceValue,
3182 struct DisassembleInfo *info) {
3184 uint32_t offset, left;
3187 // The pointer_value can be 0 in an object file and have a relocation
3188 // entry for the class symbol at the ReferenceValue (the address of the
3190 if (pointer_value == 0) {
3191 r = get_pointer_64(ReferenceValue, offset, left, S, info);
3192 if (r == nullptr || left < sizeof(uint64_t))
3195 const char *symbol_name = get_symbol_64(offset, S, info, n_value);
3196 if (symbol_name == nullptr)
3198 const char *class_name = strrchr(symbol_name, '$');
3199 if (class_name != nullptr && class_name[1] == '_' && class_name[2] != '\0')
3200 return class_name + 2;
3205 // The case were the pointer_value is non-zero and points to a class defined
3206 // in this Mach-O file.
3207 r = get_pointer_64(pointer_value, offset, left, S, info);
3208 if (r == nullptr || left < sizeof(struct class64_t))
3211 memcpy(&c, r, sizeof(struct class64_t));
3212 if (info->O->isLittleEndian() != sys::IsLittleEndianHost)
3216 r = get_pointer_64(c.data, offset, left, S, info);
3217 if (r == nullptr || left < sizeof(struct class_ro64_t))
3219 struct class_ro64_t cro;
3220 memcpy(&cro, r, sizeof(struct class_ro64_t));
3221 if (info->O->isLittleEndian() != sys::IsLittleEndianHost)
3225 const char *name = get_pointer_64(cro.name, offset, left, S, info);
3229 // get_objc2_64bit_cfstring_name is used for disassembly and is passed a
3230 // pointer to a cfstring and returns its name or nullptr.
3231 static const char *get_objc2_64bit_cfstring_name(uint64_t ReferenceValue,
3232 struct DisassembleInfo *info) {
3233 const char *r, *name;
3234 uint32_t offset, left;
3236 struct cfstring64_t cfs;
3237 uint64_t cfs_characters;
3239 r = get_pointer_64(ReferenceValue, offset, left, S, info);
3240 if (r == nullptr || left < sizeof(struct cfstring64_t))
3242 memcpy(&cfs, r, sizeof(struct cfstring64_t));
3243 if (info->O->isLittleEndian() != sys::IsLittleEndianHost)
3245 if (cfs.characters == 0) {
3247 const char *symbol_name = get_symbol_64(
3248 offset + offsetof(struct cfstring64_t, characters), S, info, n_value);
3249 if (symbol_name == nullptr)
3251 cfs_characters = n_value;
3253 cfs_characters = cfs.characters;
3254 name = get_pointer_64(cfs_characters, offset, left, S, info);
3259 // get_objc2_64bit_selref() is used for disassembly and is passed a the address
3260 // of a pointer to an Objective-C selector reference when the pointer value is
3261 // zero as in a .o file and is likely to have a external relocation entry with
3262 // who's symbol's n_value is the real pointer to the selector name. If that is
3263 // the case the real pointer to the selector name is returned else 0 is
3265 static uint64_t get_objc2_64bit_selref(uint64_t ReferenceValue,
3266 struct DisassembleInfo *info) {
3267 uint32_t offset, left;
3270 const char *r = get_pointer_64(ReferenceValue, offset, left, S, info);
3271 if (r == nullptr || left < sizeof(uint64_t))
3274 const char *symbol_name = get_symbol_64(offset, S, info, n_value);
3275 if (symbol_name == nullptr)
3280 static const SectionRef get_section(MachOObjectFile *O, const char *segname,
3281 const char *sectname) {
3282 for (const SectionRef &Section : O->sections()) {
3284 Section.getName(SectName);
3285 DataRefImpl Ref = Section.getRawDataRefImpl();
3286 StringRef SegName = O->getSectionFinalSegmentName(Ref);
3287 if (SegName == segname && SectName == sectname)
3290 return SectionRef();
3294 walk_pointer_list_64(const char *listname, const SectionRef S,
3295 MachOObjectFile *O, struct DisassembleInfo *info,
3296 void (*func)(uint64_t, struct DisassembleInfo *info)) {
3297 if (S == SectionRef())
3301 S.getName(SectName);
3302 DataRefImpl Ref = S.getRawDataRefImpl();
3303 StringRef SegName = O->getSectionFinalSegmentName(Ref);
3304 outs() << "Contents of (" << SegName << "," << SectName << ") section\n";
3307 S.getContents(BytesStr);
3308 const char *Contents = reinterpret_cast<const char *>(BytesStr.data());
3310 for (uint32_t i = 0; i < S.getSize(); i += sizeof(uint64_t)) {
3311 uint32_t left = S.getSize() - i;
3312 uint32_t size = left < sizeof(uint64_t) ? left : sizeof(uint64_t);
3314 memcpy(&p, Contents + i, size);
3315 if (i + sizeof(uint64_t) > S.getSize())
3316 outs() << listname << " list pointer extends past end of (" << SegName
3317 << "," << SectName << ") section\n";
3318 outs() << format("%016" PRIx64, S.getAddress() + i) << " ";
3320 if (O->isLittleEndian() != sys::IsLittleEndianHost)
3321 sys::swapByteOrder(p);
3323 uint64_t n_value = 0;
3324 const char *name = get_symbol_64(i, S, info, n_value, p);
3325 if (name == nullptr)
3326 name = get_dyld_bind_info_symbolname(S.getAddress() + i, info);
3329 outs() << format("0x%" PRIx64, n_value);
3331 outs() << " + " << format("0x%" PRIx64, p);
3333 outs() << format("0x%" PRIx64, p);
3334 if (name != nullptr)
3335 outs() << " " << name;
3345 walk_pointer_list_32(const char *listname, const SectionRef S,
3346 MachOObjectFile *O, struct DisassembleInfo *info,
3347 void (*func)(uint32_t, struct DisassembleInfo *info)) {
3348 if (S == SectionRef())
3352 S.getName(SectName);
3353 DataRefImpl Ref = S.getRawDataRefImpl();
3354 StringRef SegName = O->getSectionFinalSegmentName(Ref);
3355 outs() << "Contents of (" << SegName << "," << SectName << ") section\n";
3358 S.getContents(BytesStr);
3359 const char *Contents = reinterpret_cast<const char *>(BytesStr.data());
3361 for (uint32_t i = 0; i < S.getSize(); i += sizeof(uint32_t)) {
3362 uint32_t left = S.getSize() - i;
3363 uint32_t size = left < sizeof(uint32_t) ? left : sizeof(uint32_t);
3365 memcpy(&p, Contents + i, size);
3366 if (i + sizeof(uint32_t) > S.getSize())
3367 outs() << listname << " list pointer extends past end of (" << SegName
3368 << "," << SectName << ") section\n";
3369 uint32_t Address = S.getAddress() + i;
3370 outs() << format("%08" PRIx32, Address) << " ";
3372 if (O->isLittleEndian() != sys::IsLittleEndianHost)
3373 sys::swapByteOrder(p);
3374 outs() << format("0x%" PRIx32, p);
3376 const char *name = get_symbol_32(i, S, info, p);
3377 if (name != nullptr)
3378 outs() << " " << name;
3386 static void print_layout_map(const char *layout_map, uint32_t left) {
3387 if (layout_map == nullptr)
3389 outs() << " layout map: ";
3391 outs() << format("0x%02" PRIx32, (*layout_map) & 0xff) << " ";
3394 } while (*layout_map != '\0' && left != 0);
3398 static void print_layout_map64(uint64_t p, struct DisassembleInfo *info) {
3399 uint32_t offset, left;
3401 const char *layout_map;
3405 layout_map = get_pointer_64(p, offset, left, S, info);
3406 print_layout_map(layout_map, left);
3409 static void print_layout_map32(uint32_t p, struct DisassembleInfo *info) {
3410 uint32_t offset, left;
3412 const char *layout_map;
3416 layout_map = get_pointer_32(p, offset, left, S, info);
3417 print_layout_map(layout_map, left);
3420 static void print_method_list64_t(uint64_t p, struct DisassembleInfo *info,
3421 const char *indent) {
3422 struct method_list64_t ml;
3423 struct method64_t m;
3425 uint32_t offset, xoffset, left, i;
3427 const char *name, *sym_name;
3430 r = get_pointer_64(p, offset, left, S, info);
3433 memset(&ml, '\0', sizeof(struct method_list64_t));
3434 if (left < sizeof(struct method_list64_t)) {
3435 memcpy(&ml, r, left);
3436 outs() << " (method_list_t entends past the end of the section)\n";
3438 memcpy(&ml, r, sizeof(struct method_list64_t));
3439 if (info->O->isLittleEndian() != sys::IsLittleEndianHost)
3441 outs() << indent << "\t\t entsize " << ml.entsize << "\n";
3442 outs() << indent << "\t\t count " << ml.count << "\n";
3444 p += sizeof(struct method_list64_t);
3445 offset += sizeof(struct method_list64_t);
3446 for (i = 0; i < ml.count; i++) {
3447 r = get_pointer_64(p, offset, left, S, info);
3450 memset(&m, '\0', sizeof(struct method64_t));
3451 if (left < sizeof(struct method64_t)) {
3452 memcpy(&m, r, left);
3453 outs() << indent << " (method_t extends past the end of the section)\n";
3455 memcpy(&m, r, sizeof(struct method64_t));
3456 if (info->O->isLittleEndian() != sys::IsLittleEndianHost)
3459 outs() << indent << "\t\t name ";
3460 sym_name = get_symbol_64(offset + offsetof(struct method64_t, name), S,
3461 info, n_value, m.name);
3463 if (info->verbose && sym_name != nullptr)
3466 outs() << format("0x%" PRIx64, n_value);
3468 outs() << " + " << format("0x%" PRIx64, m.name);
3470 outs() << format("0x%" PRIx64, m.name);
3471 name = get_pointer_64(m.name + n_value, xoffset, left, xS, info);
3472 if (name != nullptr)
3473 outs() << format(" %.*s", left, name);
3476 outs() << indent << "\t\t types ";
3477 sym_name = get_symbol_64(offset + offsetof(struct method64_t, types), S,
3478 info, n_value, m.types);
3480 if (info->verbose && sym_name != nullptr)
3483 outs() << format("0x%" PRIx64, n_value);
3485 outs() << " + " << format("0x%" PRIx64, m.types);
3487 outs() << format("0x%" PRIx64, m.types);
3488 name = get_pointer_64(m.types + n_value, xoffset, left, xS, info);
3489 if (name != nullptr)
3490 outs() << format(" %.*s", left, name);
3493 outs() << indent << "\t\t imp ";
3494 name = get_symbol_64(offset + offsetof(struct method64_t, imp), S, info,
3496 if (info->verbose && name == nullptr) {
3498 outs() << format("0x%" PRIx64, n_value) << " ";
3500 outs() << "+ " << format("0x%" PRIx64, m.imp) << " ";
3502 outs() << format("0x%" PRIx64, m.imp) << " ";
3504 if (name != nullptr)
3508 p += sizeof(struct method64_t);
3509 offset += sizeof(struct method64_t);
3513 static void print_method_list32_t(uint64_t p, struct DisassembleInfo *info,
3514 const char *indent) {
3515 struct method_list32_t ml;
3516 struct method32_t m;
3517 const char *r, *name;
3518 uint32_t offset, xoffset, left, i;
3521 r = get_pointer_32(p, offset, left, S, info);
3524 memset(&ml, '\0', sizeof(struct method_list32_t));
3525 if (left < sizeof(struct method_list32_t)) {
3526 memcpy(&ml, r, left);
3527 outs() << " (method_list_t entends past the end of the section)\n";
3529 memcpy(&ml, r, sizeof(struct method_list32_t));
3530 if (info->O->isLittleEndian() != sys::IsLittleEndianHost)
3532 outs() << indent << "\t\t entsize " << ml.entsize << "\n";
3533 outs() << indent << "\t\t count " << ml.count << "\n";
3535 p += sizeof(struct method_list32_t);
3536 offset += sizeof(struct method_list32_t);
3537 for (i = 0; i < ml.count; i++) {
3538 r = get_pointer_32(p, offset, left, S, info);
3541 memset(&m, '\0', sizeof(struct method32_t));
3542 if (left < sizeof(struct method32_t)) {
3543 memcpy(&ml, r, left);
3544 outs() << indent << " (method_t entends past the end of the section)\n";
3546 memcpy(&m, r, sizeof(struct method32_t));
3547 if (info->O->isLittleEndian() != sys::IsLittleEndianHost)
3550 outs() << indent << "\t\t name " << format("0x%" PRIx32, m.name);
3551 name = get_pointer_32(m.name, xoffset, left, xS, info);
3552 if (name != nullptr)
3553 outs() << format(" %.*s", left, name);
3556 outs() << indent << "\t\t types " << format("0x%" PRIx32, m.types);
3557 name = get_pointer_32(m.types, xoffset, left, xS, info);
3558 if (name != nullptr)
3559 outs() << format(" %.*s", left, name);
3562 outs() << indent << "\t\t imp " << format("0x%" PRIx32, m.imp);
3563 name = get_symbol_32(offset + offsetof(struct method32_t, imp), S, info,
3565 if (name != nullptr)
3566 outs() << " " << name;
3569 p += sizeof(struct method32_t);
3570 offset += sizeof(struct method32_t);
3574 static bool print_method_list(uint32_t p, struct DisassembleInfo *info) {
3575 uint32_t offset, left, xleft;
3577 struct objc_method_list_t method_list;
3578 struct objc_method_t method;
3579 const char *r, *methods, *name, *SymbolName;
3582 r = get_pointer_32(p, offset, left, S, info, true);
3587 if (left > sizeof(struct objc_method_list_t)) {
3588 memcpy(&method_list, r, sizeof(struct objc_method_list_t));
3590 outs() << "\t\t objc_method_list extends past end of the section\n";
3591 memset(&method_list, '\0', sizeof(struct objc_method_list_t));
3592 memcpy(&method_list, r, left);
3594 if (info->O->isLittleEndian() != sys::IsLittleEndianHost)
3595 swapStruct(method_list);
3597 outs() << "\t\t obsolete "
3598 << format("0x%08" PRIx32, method_list.obsolete) << "\n";
3599 outs() << "\t\t method_count " << method_list.method_count << "\n";
3601 methods = r + sizeof(struct objc_method_list_t);
3602 for (i = 0; i < method_list.method_count; i++) {
3603 if ((i + 1) * sizeof(struct objc_method_t) > left) {
3604 outs() << "\t\t remaining method's extend past the of the section\n";
3607 memcpy(&method, methods + i * sizeof(struct objc_method_t),
3608 sizeof(struct objc_method_t));
3609 if (info->O->isLittleEndian() != sys::IsLittleEndianHost)
3612 outs() << "\t\t method_name "
3613 << format("0x%08" PRIx32, method.method_name);
3614 if (info->verbose) {
3615 name = get_pointer_32(method.method_name, offset, xleft, S, info, true);
3616 if (name != nullptr)
3617 outs() << format(" %.*s", xleft, name);
3619 outs() << " (not in an __OBJC section)";
3623 outs() << "\t\t method_types "
3624 << format("0x%08" PRIx32, method.method_types);
3625 if (info->verbose) {
3626 name = get_pointer_32(method.method_types, offset, xleft, S, info, true);
3627 if (name != nullptr)
3628 outs() << format(" %.*s", xleft, name);
3630 outs() << " (not in an __OBJC section)";
3634 outs() << "\t\t method_imp "
3635 << format("0x%08" PRIx32, method.method_imp) << " ";
3636 if (info->verbose) {
3637 SymbolName = GuessSymbolName(method.method_imp, info->AddrMap);
3638 if (SymbolName != nullptr)
3639 outs() << SymbolName;
3646 static void print_protocol_list64_t(uint64_t p, struct DisassembleInfo *info) {
3647 struct protocol_list64_t pl;
3648 uint64_t q, n_value;
3649 struct protocol64_t pc;
3651 uint32_t offset, xoffset, left, i;
3653 const char *name, *sym_name;
3655 r = get_pointer_64(p, offset, left, S, info);
3658 memset(&pl, '\0', sizeof(struct protocol_list64_t));
3659 if (left < sizeof(struct protocol_list64_t)) {
3660 memcpy(&pl, r, left);
3661 outs() << " (protocol_list_t entends past the end of the section)\n";
3663 memcpy(&pl, r, sizeof(struct protocol_list64_t));
3664 if (info->O->isLittleEndian() != sys::IsLittleEndianHost)
3666 outs() << " count " << pl.count << "\n";
3668 p += sizeof(struct protocol_list64_t);
3669 offset += sizeof(struct protocol_list64_t);
3670 for (i = 0; i < pl.count; i++) {
3671 r = get_pointer_64(p, offset, left, S, info);
3675 if (left < sizeof(uint64_t)) {
3676 memcpy(&q, r, left);
3677 outs() << " (protocol_t * entends past the end of the section)\n";
3679 memcpy(&q, r, sizeof(uint64_t));
3680 if (info->O->isLittleEndian() != sys::IsLittleEndianHost)
3681 sys::swapByteOrder(q);
3683 outs() << "\t\t list[" << i << "] ";
3684 sym_name = get_symbol_64(offset, S, info, n_value, q);
3686 if (info->verbose && sym_name != nullptr)
3689 outs() << format("0x%" PRIx64, n_value);
3691 outs() << " + " << format("0x%" PRIx64, q);
3693 outs() << format("0x%" PRIx64, q);
3694 outs() << " (struct protocol_t *)\n";
3696 r = get_pointer_64(q + n_value, offset, left, S, info);
3699 memset(&pc, '\0', sizeof(struct protocol64_t));
3700 if (left < sizeof(struct protocol64_t)) {
3701 memcpy(&pc, r, left);
3702 outs() << " (protocol_t entends past the end of the section)\n";
3704 memcpy(&pc, r, sizeof(struct protocol64_t));
3705 if (info->O->isLittleEndian() != sys::IsLittleEndianHost)
3708 outs() << "\t\t\t isa " << format("0x%" PRIx64, pc.isa) << "\n";
3710 outs() << "\t\t\t name ";
3711 sym_name = get_symbol_64(offset + offsetof(struct protocol64_t, name), S,
3712 info, n_value, pc.name);
3714 if (info->verbose && sym_name != nullptr)
3717 outs() << format("0x%" PRIx64, n_value);
3719 outs() << " + " << format("0x%" PRIx64, pc.name);
3721 outs() << format("0x%" PRIx64, pc.name);
3722 name = get_pointer_64(pc.name + n_value, xoffset, left, xS, info);
3723 if (name != nullptr)
3724 outs() << format(" %.*s", left, name);
3727 outs() << "\t\t\tprotocols " << format("0x%" PRIx64, pc.protocols) << "\n";
3729 outs() << "\t\t instanceMethods ";
3731 get_symbol_64(offset + offsetof(struct protocol64_t, instanceMethods),
3732 S, info, n_value, pc.instanceMethods);
3734 if (info->verbose && sym_name != nullptr)
3737 outs() << format("0x%" PRIx64, n_value);
3738 if (pc.instanceMethods != 0)
3739 outs() << " + " << format("0x%" PRIx64, pc.instanceMethods);
3741 outs() << format("0x%" PRIx64, pc.instanceMethods);
3742 outs() << " (struct method_list_t *)\n";
3743 if (pc.instanceMethods + n_value != 0)
3744 print_method_list64_t(pc.instanceMethods + n_value, info, "\t");
3746 outs() << "\t\t classMethods ";
3748 get_symbol_64(offset + offsetof(struct protocol64_t, classMethods), S,
3749 info, n_value, pc.classMethods);
3751 if (info->verbose && sym_name != nullptr)
3754 outs() << format("0x%" PRIx64, n_value);
3755 if (pc.classMethods != 0)
3756 outs() << " + " << format("0x%" PRIx64, pc.classMethods);
3758 outs() << format("0x%" PRIx64, pc.classMethods);
3759 outs() << " (struct method_list_t *)\n";
3760 if (pc.classMethods + n_value != 0)
3761 print_method_list64_t(pc.classMethods + n_value, info, "\t");
3763 outs() << "\t optionalInstanceMethods "
3764 << format("0x%" PRIx64, pc.optionalInstanceMethods) << "\n";
3765 outs() << "\t optionalClassMethods "
3766 << format("0x%" PRIx64, pc.optionalClassMethods) << "\n";
3767 outs() << "\t instanceProperties "
3768 << format("0x%" PRIx64, pc.instanceProperties) << "\n";
3770 p += sizeof(uint64_t);
3771 offset += sizeof(uint64_t);
3775 static void print_protocol_list32_t(uint32_t p, struct DisassembleInfo *info) {
3776 struct protocol_list32_t pl;
3778 struct protocol32_t pc;
3780 uint32_t offset, xoffset, left, i;
3784 r = get_pointer_32(p, offset, left, S, info);
3787 memset(&pl, '\0', sizeof(struct protocol_list32_t));
3788 if (left < sizeof(struct protocol_list32_t)) {
3789 memcpy(&pl, r, left);
3790 outs() << " (protocol_list_t entends past the end of the section)\n";
3792 memcpy(&pl, r, sizeof(struct protocol_list32_t));
3793 if (info->O->isLittleEndian() != sys::IsLittleEndianHost)
3795 outs() << " count " << pl.count << "\n";
3797 p += sizeof(struct protocol_list32_t);
3798 offset += sizeof(struct protocol_list32_t);
3799 for (i = 0; i < pl.count; i++) {
3800 r = get_pointer_32(p, offset, left, S, info);
3804 if (left < sizeof(uint32_t)) {
3805 memcpy(&q, r, left);
3806 outs() << " (protocol_t * entends past the end of the section)\n";
3808 memcpy(&q, r, sizeof(uint32_t));
3809 if (info->O->isLittleEndian() != sys::IsLittleEndianHost)
3810 sys::swapByteOrder(q);
3811 outs() << "\t\t list[" << i << "] " << format("0x%" PRIx32, q)
3812 << " (struct protocol_t *)\n";
3813 r = get_pointer_32(q, offset, left, S, info);
3816 memset(&pc, '\0', sizeof(struct protocol32_t));
3817 if (left < sizeof(struct protocol32_t)) {
3818 memcpy(&pc, r, left);
3819 outs() << " (protocol_t entends past the end of the section)\n";
3821 memcpy(&pc, r, sizeof(struct protocol32_t));
3822 if (info->O->isLittleEndian() != sys::IsLittleEndianHost)
3824 outs() << "\t\t\t isa " << format("0x%" PRIx32, pc.isa) << "\n";
3825 outs() << "\t\t\t name " << format("0x%" PRIx32, pc.name);
3826 name = get_pointer_32(pc.name, xoffset, left, xS, info);
3827 if (name != nullptr)
3828 outs() << format(" %.*s", left, name);
3830 outs() << "\t\t\tprotocols " << format("0x%" PRIx32, pc.protocols) << "\n";
3831 outs() << "\t\t instanceMethods "
3832 << format("0x%" PRIx32, pc.instanceMethods)
3833 << " (struct method_list_t *)\n";
3834 if (pc.instanceMethods != 0)
3835 print_method_list32_t(pc.instanceMethods, info, "\t");
3836 outs() << "\t\t classMethods " << format("0x%" PRIx32, pc.classMethods)
3837 << " (struct method_list_t *)\n";
3838 if (pc.classMethods != 0)
3839 print_method_list32_t(pc.classMethods, info, "\t");
3840 outs() << "\t optionalInstanceMethods "
3841 << format("0x%" PRIx32, pc.optionalInstanceMethods) << "\n";
3842 outs() << "\t optionalClassMethods "
3843 << format("0x%" PRIx32, pc.optionalClassMethods) << "\n";
3844 outs() << "\t instanceProperties "
3845 << format("0x%" PRIx32, pc.instanceProperties) << "\n";
3846 p += sizeof(uint32_t);
3847 offset += sizeof(uint32_t);
3851 static void print_indent(uint32_t indent) {
3852 for (uint32_t i = 0; i < indent;) {
3853 if (indent - i >= 8) {
3857 for (uint32_t j = i; j < indent; j++)
3864 static bool print_method_description_list(uint32_t p, uint32_t indent,
3865 struct DisassembleInfo *info) {
3866 uint32_t offset, left, xleft;
3868 struct objc_method_description_list_t mdl;
3869 struct objc_method_description_t md;
3870 const char *r, *list, *name;
3873 r = get_pointer_32(p, offset, left, S, info, true);
3878 if (left > sizeof(struct objc_method_description_list_t)) {
3879 memcpy(&mdl, r, sizeof(struct objc_method_description_list_t));
3881 print_indent(indent);
3882 outs() << " objc_method_description_list extends past end of the section\n";
3883 memset(&mdl, '\0', sizeof(struct objc_method_description_list_t));
3884 memcpy(&mdl, r, left);
3886 if (info->O->isLittleEndian() != sys::IsLittleEndianHost)
3889 print_indent(indent);
3890 outs() << " count " << mdl.count << "\n";
3892 list = r + sizeof(struct objc_method_description_list_t);
3893 for (i = 0; i < mdl.count; i++) {
3894 if ((i + 1) * sizeof(struct objc_method_description_t) > left) {
3895 print_indent(indent);
3896 outs() << " remaining list entries extend past the of the section\n";
3899 print_indent(indent);
3900 outs() << " list[" << i << "]\n";
3901 memcpy(&md, list + i * sizeof(struct objc_method_description_t),
3902 sizeof(struct objc_method_description_t));
3903 if (info->O->isLittleEndian() != sys::IsLittleEndianHost)
3906 print_indent(indent);
3907 outs() << " name " << format("0x%08" PRIx32, md.name);
3908 if (info->verbose) {
3909 name = get_pointer_32(md.name, offset, xleft, S, info, true);
3910 if (name != nullptr)
3911 outs() << format(" %.*s", xleft, name);
3913 outs() << " (not in an __OBJC section)";
3917 print_indent(indent);
3918 outs() << " types " << format("0x%08" PRIx32, md.types);
3919 if (info->verbose) {
3920 name = get_pointer_32(md.types, offset, xleft, S, info, true);
3921 if (name != nullptr)
3922 outs() << format(" %.*s", xleft, name);
3924 outs() << " (not in an __OBJC section)";
3931 static bool print_protocol_list(uint32_t p, uint32_t indent,
3932 struct DisassembleInfo *info);
3934 static bool print_protocol(uint32_t p, uint32_t indent,
3935 struct DisassembleInfo *info) {
3936 uint32_t offset, left;
3938 struct objc_protocol_t protocol;
3939 const char *r, *name;
3941 r = get_pointer_32(p, offset, left, S, info, true);
3946 if (left >= sizeof(struct objc_protocol_t)) {
3947 memcpy(&protocol, r, sizeof(struct objc_protocol_t));
3949 print_indent(indent);
3950 outs() << " Protocol extends past end of the section\n";
3951 memset(&protocol, '\0', sizeof(struct objc_protocol_t));
3952 memcpy(&protocol, r, left);
3954 if (info->O->isLittleEndian() != sys::IsLittleEndianHost)
3955 swapStruct(protocol);
3957 print_indent(indent);
3958 outs() << " isa " << format("0x%08" PRIx32, protocol.isa)
3961 print_indent(indent);
3962 outs() << " protocol_name "
3963 << format("0x%08" PRIx32, protocol.protocol_name);
3964 if (info->verbose) {
3965 name = get_pointer_32(protocol.protocol_name, offset, left, S, info, true);
3966 if (name != nullptr)
3967 outs() << format(" %.*s", left, name);
3969 outs() << " (not in an __OBJC section)";
3973 print_indent(indent);
3974 outs() << " protocol_list "
3975 << format("0x%08" PRIx32, protocol.protocol_list);
3976 if (print_protocol_list(protocol.protocol_list, indent + 4, info))
3977 outs() << " (not in an __OBJC section)\n";
3979 print_indent(indent);
3980 outs() << " instance_methods "
3981 << format("0x%08" PRIx32, protocol.instance_methods);
3982 if (print_method_description_list(protocol.instance_methods, indent, info))
3983 outs() << " (not in an __OBJC section)\n";
3985 print_indent(indent);
3986 outs() << " class_methods "
3987 << format("0x%08" PRIx32, protocol.class_methods);
3988 if (print_method_description_list(protocol.class_methods, indent, info))
3989 outs() << " (not in an __OBJC section)\n";
3994 static bool print_protocol_list(uint32_t p, uint32_t indent,
3995 struct DisassembleInfo *info) {
3996 uint32_t offset, left, l;
3998 struct objc_protocol_list_t protocol_list;
3999 const char *r, *list;
4002 r = get_pointer_32(p, offset, left, S, info, true);
4007 if (left > sizeof(struct objc_protocol_list_t)) {
4008 memcpy(&protocol_list, r, sizeof(struct objc_protocol_list_t));
4010 outs() << "\t\t objc_protocol_list_t extends past end of the section\n";
4011 memset(&protocol_list, '\0', sizeof(struct objc_protocol_list_t));
4012 memcpy(&protocol_list, r, left);
4014 if (info->O->isLittleEndian() != sys::IsLittleEndianHost)
4015 swapStruct(protocol_list);
4017 print_indent(indent);
4018 outs() << " next " << format("0x%08" PRIx32, protocol_list.next)
4020 print_indent(indent);
4021 outs() << " count " << protocol_list.count << "\n";
4023 list = r + sizeof(struct objc_protocol_list_t);
4024 for (i = 0; i < protocol_list.count; i++) {
4025 if ((i + 1) * sizeof(uint32_t) > left) {
4026 outs() << "\t\t remaining list entries extend past the of the section\n";
4029 memcpy(&l, list + i * sizeof(uint32_t), sizeof(uint32_t));
4030 if (info->O->isLittleEndian() != sys::IsLittleEndianHost)
4031 sys::swapByteOrder(l);
4033 print_indent(indent);
4034 outs() << " list[" << i << "] " << format("0x%08" PRIx32, l);
4035 if (print_protocol(l, indent, info))
4036 outs() << "(not in an __OBJC section)\n";
4041 static void print_ivar_list64_t(uint64_t p, struct DisassembleInfo *info) {
4042 struct ivar_list64_t il;
4045 uint32_t offset, xoffset, left, j;
4047 const char *name, *sym_name, *ivar_offset_p;
4048 uint64_t ivar_offset, n_value;
4050 r = get_pointer_64(p, offset, left, S, info);
4053 memset(&il, '\0', sizeof(struct ivar_list64_t));
4054 if (left < sizeof(struct ivar_list64_t)) {
4055 memcpy(&il, r, left);
4056 outs() << " (ivar_list_t entends past the end of the section)\n";
4058 memcpy(&il, r, sizeof(struct ivar_list64_t));
4059 if (info->O->isLittleEndian() != sys::IsLittleEndianHost)
4061 outs() << " entsize " << il.entsize << "\n";
4062 outs() << " count " << il.count << "\n";
4064 p += sizeof(struct ivar_list64_t);
4065 offset += sizeof(struct ivar_list64_t);
4066 for (j = 0; j < il.count; j++) {
4067 r = get_pointer_64(p, offset, left, S, info);
4070 memset(&i, '\0', sizeof(struct ivar64_t));
4071 if (left < sizeof(struct ivar64_t)) {
4072 memcpy(&i, r, left);
4073 outs() << " (ivar_t entends past the end of the section)\n";
4075 memcpy(&i, r, sizeof(struct ivar64_t));
4076 if (info->O->isLittleEndian() != sys::IsLittleEndianHost)
4079 outs() << "\t\t\t offset ";
4080 sym_name = get_symbol_64(offset + offsetof(struct ivar64_t, offset), S,
4081 info, n_value, i.offset);
4083 if (info->verbose && sym_name != nullptr)
4086 outs() << format("0x%" PRIx64, n_value);
4088 outs() << " + " << format("0x%" PRIx64, i.offset);
4090 outs() << format("0x%" PRIx64, i.offset);
4091 ivar_offset_p = get_pointer_64(i.offset + n_value, xoffset, left, xS, info);
4092 if (ivar_offset_p != nullptr && left >= sizeof(*ivar_offset_p)) {
4093 memcpy(&ivar_offset, ivar_offset_p, sizeof(ivar_offset));
4094 if (info->O->isLittleEndian() != sys::IsLittleEndianHost)
4095 sys::swapByteOrder(ivar_offset);
4096 outs() << " " << ivar_offset << "\n";
4100 outs() << "\t\t\t name ";
4101 sym_name = get_symbol_64(offset + offsetof(struct ivar64_t, name), S, info,
4104 if (info->verbose && sym_name != nullptr)
4107 outs() << format("0x%" PRIx64, n_value);
4109 outs() << " + " << format("0x%" PRIx64, i.name);
4111 outs() << format("0x%" PRIx64, i.name);
4112 name = get_pointer_64(i.name + n_value, xoffset, left, xS, info);
4113 if (name != nullptr)
4114 outs() << format(" %.*s", left, name);
4117 outs() << "\t\t\t type ";
4118 sym_name = get_symbol_64(offset + offsetof(struct ivar64_t, type), S, info,
4120 name = get_pointer_64(i.type + n_value, xoffset, left, xS, info);
4122 if (info->verbose && sym_name != nullptr)
4125 outs() << format("0x%" PRIx64, n_value);
4127 outs() << " + " << format("0x%" PRIx64, i.type);
4129 outs() << format("0x%" PRIx64, i.type);
4130 if (name != nullptr)
4131 outs() << format(" %.*s", left, name);
4134 outs() << "\t\t\talignment " << i.alignment << "\n";
4135 outs() << "\t\t\t size " << i.size << "\n";
4137 p += sizeof(struct ivar64_t);
4138 offset += sizeof(struct ivar64_t);
4142 static void print_ivar_list32_t(uint32_t p, struct DisassembleInfo *info) {
4143 struct ivar_list32_t il;
4146 uint32_t offset, xoffset, left, j;
4148 const char *name, *ivar_offset_p;
4149 uint32_t ivar_offset;
4151 r = get_pointer_32(p, offset, left, S, info);
4154 memset(&il, '\0', sizeof(struct ivar_list32_t));
4155 if (left < sizeof(struct ivar_list32_t)) {
4156 memcpy(&il, r, left);
4157 outs() << " (ivar_list_t entends past the end of the section)\n";
4159 memcpy(&il, r, sizeof(struct ivar_list32_t));
4160 if (info->O->isLittleEndian() != sys::IsLittleEndianHost)
4162 outs() << " entsize " << il.entsize << "\n";
4163 outs() << " count " << il.count << "\n";
4165 p += sizeof(struct ivar_list32_t);
4166 offset += sizeof(struct ivar_list32_t);
4167 for (j = 0; j < il.count; j++) {
4168 r = get_pointer_32(p, offset, left, S, info);
4171 memset(&i, '\0', sizeof(struct ivar32_t));
4172 if (left < sizeof(struct ivar32_t)) {
4173 memcpy(&i, r, left);
4174 outs() << " (ivar_t entends past the end of the section)\n";
4176 memcpy(&i, r, sizeof(struct ivar32_t));
4177 if (info->O->isLittleEndian() != sys::IsLittleEndianHost)
4180 outs() << "\t\t\t offset " << format("0x%" PRIx32, i.offset);
4181 ivar_offset_p = get_pointer_32(i.offset, xoffset, left, xS, info);
4182 if (ivar_offset_p != nullptr && left >= sizeof(*ivar_offset_p)) {
4183 memcpy(&ivar_offset, ivar_offset_p, sizeof(ivar_offset));
4184 if (info->O->isLittleEndian() != sys::IsLittleEndianHost)
4185 sys::swapByteOrder(ivar_offset);
4186 outs() << " " << ivar_offset << "\n";
4190 outs() << "\t\t\t name " << format("0x%" PRIx32, i.name);
4191 name = get_pointer_32(i.name, xoffset, left, xS, info);
4192 if (name != nullptr)
4193 outs() << format(" %.*s", left, name);
4196 outs() << "\t\t\t type " << format("0x%" PRIx32, i.type);
4197 name = get_pointer_32(i.type, xoffset, left, xS, info);
4198 if (name != nullptr)
4199 outs() << format(" %.*s", left, name);
4202 outs() << "\t\t\talignment " << i.alignment << "\n";
4203 outs() << "\t\t\t size " << i.size << "\n";
4205 p += sizeof(struct ivar32_t);
4206 offset += sizeof(struct ivar32_t);
4210 static void print_objc_property_list64(uint64_t p,
4211 struct DisassembleInfo *info) {
4212 struct objc_property_list64 opl;
4213 struct objc_property64 op;
4215 uint32_t offset, xoffset, left, j;
4217 const char *name, *sym_name;
4220 r = get_pointer_64(p, offset, left, S, info);
4223 memset(&opl, '\0', sizeof(struct objc_property_list64));
4224 if (left < sizeof(struct objc_property_list64)) {
4225 memcpy(&opl, r, left);
4226 outs() << " (objc_property_list entends past the end of the section)\n";
4228 memcpy(&opl, r, sizeof(struct objc_property_list64));
4229 if (info->O->isLittleEndian() != sys::IsLittleEndianHost)
4231 outs() << " entsize " << opl.entsize << "\n";
4232 outs() << " count " << opl.count << "\n";
4234 p += sizeof(struct objc_property_list64);
4235 offset += sizeof(struct objc_property_list64);
4236 for (j = 0; j < opl.count; j++) {
4237 r = get_pointer_64(p, offset, left, S, info);
4240 memset(&op, '\0', sizeof(struct objc_property64));
4241 if (left < sizeof(struct objc_property64)) {
4242 memcpy(&op, r, left);
4243 outs() << " (objc_property entends past the end of the section)\n";
4245 memcpy(&op, r, sizeof(struct objc_property64));
4246 if (info->O->isLittleEndian() != sys::IsLittleEndianHost)
4249 outs() << "\t\t\t name ";
4250 sym_name = get_symbol_64(offset + offsetof(struct objc_property64, name), S,
4251 info, n_value, op.name);
4253 if (info->verbose && sym_name != nullptr)
4256 outs() << format("0x%" PRIx64, n_value);
4258 outs() << " + " << format("0x%" PRIx64, op.name);
4260 outs() << format("0x%" PRIx64, op.name);
4261 name = get_pointer_64(op.name + n_value, xoffset, left, xS, info);
4262 if (name != nullptr)
4263 outs() << format(" %.*s", left, name);
4266 outs() << "\t\t\tattributes ";
4268 get_symbol_64(offset + offsetof(struct objc_property64, attributes), S,
4269 info, n_value, op.attributes);
4271 if (info->verbose && sym_name != nullptr)
4274 outs() << format("0x%" PRIx64, n_value);
4275 if (op.attributes != 0)
4276 outs() << " + " << format("0x%" PRIx64, op.attributes);
4278 outs() << format("0x%" PRIx64, op.attributes);
4279 name = get_pointer_64(op.attributes + n_value, xoffset, left, xS, info);
4280 if (name != nullptr)
4281 outs() << format(" %.*s", left, name);
4284 p += sizeof(struct objc_property64);
4285 offset += sizeof(struct objc_property64);
4289 static void print_objc_property_list32(uint32_t p,
4290 struct DisassembleInfo *info) {
4291 struct objc_property_list32 opl;
4292 struct objc_property32 op;
4294 uint32_t offset, xoffset, left, j;
4298 r = get_pointer_32(p, offset, left, S, info);
4301 memset(&opl, '\0', sizeof(struct objc_property_list32));
4302 if (left < sizeof(struct objc_property_list32)) {
4303 memcpy(&opl, r, left);
4304 outs() << " (objc_property_list entends past the end of the section)\n";
4306 memcpy(&opl, r, sizeof(struct objc_property_list32));
4307 if (info->O->isLittleEndian() != sys::IsLittleEndianHost)
4309 outs() << " entsize " << opl.entsize << "\n";
4310 outs() << " count " << opl.count << "\n";
4312 p += sizeof(struct objc_property_list32);
4313 offset += sizeof(struct objc_property_list32);
4314 for (j = 0; j < opl.count; j++) {
4315 r = get_pointer_32(p, offset, left, S, info);
4318 memset(&op, '\0', sizeof(struct objc_property32));
4319 if (left < sizeof(struct objc_property32)) {
4320 memcpy(&op, r, left);
4321 outs() << " (objc_property entends past the end of the section)\n";
4323 memcpy(&op, r, sizeof(struct objc_property32));
4324 if (info->O->isLittleEndian() != sys::IsLittleEndianHost)
4327 outs() << "\t\t\t name " << format("0x%" PRIx32, op.name);
4328 name = get_pointer_32(op.name, xoffset, left, xS, info);
4329 if (name != nullptr)
4330 outs() << format(" %.*s", left, name);
4333 outs() << "\t\t\tattributes " << format("0x%" PRIx32, op.attributes);
4334 name = get_pointer_32(op.attributes, xoffset, left, xS, info);
4335 if (name != nullptr)
4336 outs() << format(" %.*s", left, name);
4339 p += sizeof(struct objc_property32);
4340 offset += sizeof(struct objc_property32);
4344 static bool print_class_ro64_t(uint64_t p, struct DisassembleInfo *info,
4345 bool &is_meta_class) {
4346 struct class_ro64_t cro;
4348 uint32_t offset, xoffset, left;
4350 const char *name, *sym_name;
4353 r = get_pointer_64(p, offset, left, S, info);
4354 if (r == nullptr || left < sizeof(struct class_ro64_t))
4356 memcpy(&cro, r, sizeof(struct class_ro64_t));
4357 if (info->O->isLittleEndian() != sys::IsLittleEndianHost)
4359 outs() << " flags " << format("0x%" PRIx32, cro.flags);
4360 if (cro.flags & RO_META)
4361 outs() << " RO_META";
4362 if (cro.flags & RO_ROOT)
4363 outs() << " RO_ROOT";
4364 if (cro.flags & RO_HAS_CXX_STRUCTORS)
4365 outs() << " RO_HAS_CXX_STRUCTORS";
4367 outs() << " instanceStart " << cro.instanceStart << "\n";
4368 outs() << " instanceSize " << cro.instanceSize << "\n";
4369 outs() << " reserved " << format("0x%" PRIx32, cro.reserved)
4371 outs() << " ivarLayout " << format("0x%" PRIx64, cro.ivarLayout)
4373 print_layout_map64(cro.ivarLayout, info);
4376 sym_name = get_symbol_64(offset + offsetof(struct class_ro64_t, name), S,
4377 info, n_value, cro.name);
4379 if (info->verbose && sym_name != nullptr)
4382 outs() << format("0x%" PRIx64, n_value);
4384 outs() << " + " << format("0x%" PRIx64, cro.name);
4386 outs() << format("0x%" PRIx64, cro.name);
4387 name = get_pointer_64(cro.name + n_value, xoffset, left, xS, info);
4388 if (name != nullptr)
4389 outs() << format(" %.*s", left, name);
4392 outs() << " baseMethods ";
4393 sym_name = get_symbol_64(offset + offsetof(struct class_ro64_t, baseMethods),
4394 S, info, n_value, cro.baseMethods);
4396 if (info->verbose && sym_name != nullptr)
4399 outs() << format("0x%" PRIx64, n_value);
4400 if (cro.baseMethods != 0)
4401 outs() << " + " << format("0x%" PRIx64, cro.baseMethods);
4403 outs() << format("0x%" PRIx64, cro.baseMethods);
4404 outs() << " (struct method_list_t *)\n";
4405 if (cro.baseMethods + n_value != 0)
4406 print_method_list64_t(cro.baseMethods + n_value, info, "");
4408 outs() << " baseProtocols ";
4410 get_symbol_64(offset + offsetof(struct class_ro64_t, baseProtocols), S,
4411 info, n_value, cro.baseProtocols);
4413 if (info->verbose && sym_name != nullptr)
4416 outs() << format("0x%" PRIx64, n_value);
4417 if (cro.baseProtocols != 0)
4418 outs() << " + " << format("0x%" PRIx64, cro.baseProtocols);
4420 outs() << format("0x%" PRIx64, cro.baseProtocols);
4422 if (cro.baseProtocols + n_value != 0)
4423 print_protocol_list64_t(cro.baseProtocols + n_value, info);
4425 outs() << " ivars ";
4426 sym_name = get_symbol_64(offset + offsetof(struct class_ro64_t, ivars), S,
4427 info, n_value, cro.ivars);
4429 if (info->verbose && sym_name != nullptr)
4432 outs() << format("0x%" PRIx64, n_value);
4434 outs() << " + " << format("0x%" PRIx64, cro.ivars);
4436 outs() << format("0x%" PRIx64, cro.ivars);
4438 if (cro.ivars + n_value != 0)
4439 print_ivar_list64_t(cro.ivars + n_value, info);
4441 outs() << " weakIvarLayout ";
4443 get_symbol_64(offset + offsetof(struct class_ro64_t, weakIvarLayout), S,
4444 info, n_value, cro.weakIvarLayout);
4446 if (info->verbose && sym_name != nullptr)
4449 outs() << format("0x%" PRIx64, n_value);
4450 if (cro.weakIvarLayout != 0)
4451 outs() << " + " << format("0x%" PRIx64, cro.weakIvarLayout);
4453 outs() << format("0x%" PRIx64, cro.weakIvarLayout);
4455 print_layout_map64(cro.weakIvarLayout + n_value, info);
4457 outs() << " baseProperties ";
4459 get_symbol_64(offset + offsetof(struct class_ro64_t, baseProperties), S,
4460 info, n_value, cro.baseProperties);
4462 if (info->verbose && sym_name != nullptr)
4465 outs() << format("0x%" PRIx64, n_value);
4466 if (cro.baseProperties != 0)
4467 outs() << " + " << format("0x%" PRIx64, cro.baseProperties);
4469 outs() << format("0x%" PRIx64, cro.baseProperties);
4471 if (cro.baseProperties + n_value != 0)
4472 print_objc_property_list64(cro.baseProperties + n_value, info);
4474 is_meta_class = (cro.flags & RO_META) != 0;
4478 static bool print_class_ro32_t(uint32_t p, struct DisassembleInfo *info,
4479 bool &is_meta_class) {
4480 struct class_ro32_t cro;
4482 uint32_t offset, xoffset, left;
4486 r = get_pointer_32(p, offset, left, S, info);
4489 memset(&cro, '\0', sizeof(struct class_ro32_t));
4490 if (left < sizeof(struct class_ro32_t)) {
4491 memcpy(&cro, r, left);
4492 outs() << " (class_ro_t entends past the end of the section)\n";
4494 memcpy(&cro, r, sizeof(struct class_ro32_t));
4495 if (info->O->isLittleEndian() != sys::IsLittleEndianHost)
4497 outs() << " flags " << format("0x%" PRIx32, cro.flags);
4498 if (cro.flags & RO_META)
4499 outs() << " RO_META";
4500 if (cro.flags & RO_ROOT)
4501 outs() << " RO_ROOT";
4502 if (cro.flags & RO_HAS_CXX_STRUCTORS)
4503 outs() << " RO_HAS_CXX_STRUCTORS";
4505 outs() << " instanceStart " << cro.instanceStart << "\n";
4506 outs() << " instanceSize " << cro.instanceSize << "\n";
4507 outs() << " ivarLayout " << format("0x%" PRIx32, cro.ivarLayout)
4509 print_layout_map32(cro.ivarLayout, info);
4511 outs() << " name " << format("0x%" PRIx32, cro.name);
4512 name = get_pointer_32(cro.name, xoffset, left, xS, info);
4513 if (name != nullptr)
4514 outs() << format(" %.*s", left, name);
4517 outs() << " baseMethods "
4518 << format("0x%" PRIx32, cro.baseMethods)
4519 << " (struct method_list_t *)\n";
4520 if (cro.baseMethods != 0)
4521 print_method_list32_t(cro.baseMethods, info, "");
4523 outs() << " baseProtocols "
4524 << format("0x%" PRIx32, cro.baseProtocols) << "\n";
4525 if (cro.baseProtocols != 0)
4526 print_protocol_list32_t(cro.baseProtocols, info);
4527 outs() << " ivars " << format("0x%" PRIx32, cro.ivars)
4530 print_ivar_list32_t(cro.ivars, info);
4531 outs() << " weakIvarLayout "
4532 << format("0x%" PRIx32, cro.weakIvarLayout) << "\n";
4533 print_layout_map32(cro.weakIvarLayout, info);
4534 outs() << " baseProperties "
4535 << format("0x%" PRIx32, cro.baseProperties) << "\n";
4536 if (cro.baseProperties != 0)
4537 print_objc_property_list32(cro.baseProperties, info);
4538 is_meta_class = (cro.flags & RO_META) != 0;
4542 static void print_class64_t(uint64_t p, struct DisassembleInfo *info) {
4545 uint32_t offset, left;
4548 uint64_t isa_n_value, n_value;
4550 r = get_pointer_64(p, offset, left, S, info);
4551 if (r == nullptr || left < sizeof(struct class64_t))
4553 memcpy(&c, r, sizeof(struct class64_t));
4554 if (info->O->isLittleEndian() != sys::IsLittleEndianHost)
4557 outs() << " isa " << format("0x%" PRIx64, c.isa);
4558 name = get_symbol_64(offset + offsetof(struct class64_t, isa), S, info,
4559 isa_n_value, c.isa);
4560 if (name != nullptr)
4561 outs() << " " << name;
4564 outs() << " superclass " << format("0x%" PRIx64, c.superclass);
4565 name = get_symbol_64(offset + offsetof(struct class64_t, superclass), S, info,
4566 n_value, c.superclass);
4567 if (name != nullptr)
4568 outs() << " " << name;
4571 outs() << " cache " << format("0x%" PRIx64, c.cache);
4572 name = get_symbol_64(offset + offsetof(struct class64_t, cache), S, info,
4574 if (name != nullptr)
4575 outs() << " " << name;
4578 outs() << " vtable " << format("0x%" PRIx64, c.vtable);
4579 name = get_symbol_64(offset + offsetof(struct class64_t, vtable), S, info,
4581 if (name != nullptr)
4582 outs() << " " << name;
4585 name = get_symbol_64(offset + offsetof(struct class64_t, data), S, info,
4589 if (info->verbose && name != nullptr)
4592 outs() << format("0x%" PRIx64, n_value);
4594 outs() << " + " << format("0x%" PRIx64, c.data);
4596 outs() << format("0x%" PRIx64, c.data);
4597 outs() << " (struct class_ro_t *)";
4599 // This is a Swift class if some of the low bits of the pointer are set.
4600 if ((c.data + n_value) & 0x7)
4601 outs() << " Swift class";
4604 if (!print_class_ro64_t((c.data + n_value) & ~0x7, info, is_meta_class))
4607 if (!is_meta_class &&
4608 c.isa + isa_n_value != p &&
4609 c.isa + isa_n_value != 0 &&
4610 info->depth < 100) {
4612 outs() << "Meta Class\n";
4613 print_class64_t(c.isa + isa_n_value, info);
4617 static void print_class32_t(uint32_t p, struct DisassembleInfo *info) {
4620 uint32_t offset, left;
4624 r = get_pointer_32(p, offset, left, S, info);
4627 memset(&c, '\0', sizeof(struct class32_t));
4628 if (left < sizeof(struct class32_t)) {
4629 memcpy(&c, r, left);
4630 outs() << " (class_t entends past the end of the section)\n";
4632 memcpy(&c, r, sizeof(struct class32_t));
4633 if (info->O->isLittleEndian() != sys::IsLittleEndianHost)
4636 outs() << " isa " << format("0x%" PRIx32, c.isa);
4638 get_symbol_32(offset + offsetof(struct class32_t, isa), S, info, c.isa);
4639 if (name != nullptr)
4640 outs() << " " << name;
4643 outs() << " superclass " << format("0x%" PRIx32, c.superclass);
4644 name = get_symbol_32(offset + offsetof(struct class32_t, superclass), S, info,
4646 if (name != nullptr)
4647 outs() << " " << name;
4650 outs() << " cache " << format("0x%" PRIx32, c.cache);
4651 name = get_symbol_32(offset + offsetof(struct class32_t, cache), S, info,
4653 if (name != nullptr)
4654 outs() << " " << name;
4657 outs() << " vtable " << format("0x%" PRIx32, c.vtable);
4658 name = get_symbol_32(offset + offsetof(struct class32_t, vtable), S, info,
4660 if (name != nullptr)
4661 outs() << " " << name;
4665 get_symbol_32(offset + offsetof(struct class32_t, data), S, info, c.data);
4666 outs() << " data " << format("0x%" PRIx32, c.data)
4667 << " (struct class_ro_t *)";
4669 // This is a Swift class if some of the low bits of the pointer are set.
4671 outs() << " Swift class";
4674 if (!print_class_ro32_t(c.data & ~0x3, info, is_meta_class))
4677 if (!is_meta_class) {
4678 outs() << "Meta Class\n";
4679 print_class32_t(c.isa, info);
4683 static void print_objc_class_t(struct objc_class_t *objc_class,
4684 struct DisassembleInfo *info) {
4685 uint32_t offset, left, xleft;
4686 const char *name, *p, *ivar_list;
4689 struct objc_ivar_list_t objc_ivar_list;
4690 struct objc_ivar_t ivar;
4692 outs() << "\t\t isa " << format("0x%08" PRIx32, objc_class->isa);
4693 if (info->verbose && CLS_GETINFO(objc_class, CLS_META)) {
4694 name = get_pointer_32(objc_class->isa, offset, left, S, info, true);
4695 if (name != nullptr)
4696 outs() << format(" %.*s", left, name);
4698 outs() << " (not in an __OBJC section)";
4702 outs() << "\t super_class "
4703 << format("0x%08" PRIx32, objc_class->super_class);
4704 if (info->verbose) {
4705 name = get_pointer_32(objc_class->super_class, offset, left, S, info, true);
4706 if (name != nullptr)
4707 outs() << format(" %.*s", left, name);
4709 outs() << " (not in an __OBJC section)";
4713 outs() << "\t\t name " << format("0x%08" PRIx32, objc_class->name);
4714 if (info->verbose) {
4715 name = get_pointer_32(objc_class->name, offset, left, S, info, true);
4716 if (name != nullptr)
4717 outs() << format(" %.*s", left, name);
4719 outs() << " (not in an __OBJC section)";
4723 outs() << "\t\t version " << format("0x%08" PRIx32, objc_class->version)
4726 outs() << "\t\t info " << format("0x%08" PRIx32, objc_class->info);
4727 if (info->verbose) {
4728 if (CLS_GETINFO(objc_class, CLS_CLASS))
4729 outs() << " CLS_CLASS";
4730 else if (CLS_GETINFO(objc_class, CLS_META))
4731 outs() << " CLS_META";
4735 outs() << "\t instance_size "
4736 << format("0x%08" PRIx32, objc_class->instance_size) << "\n";
4738 p = get_pointer_32(objc_class->ivars, offset, left, S, info, true);
4739 outs() << "\t\t ivars " << format("0x%08" PRIx32, objc_class->ivars);
4741 if (left > sizeof(struct objc_ivar_list_t)) {
4743 memcpy(&objc_ivar_list, p, sizeof(struct objc_ivar_list_t));
4745 outs() << " (entends past the end of the section)\n";
4746 memset(&objc_ivar_list, '\0', sizeof(struct objc_ivar_list_t));
4747 memcpy(&objc_ivar_list, p, left);
4749 if (info->O->isLittleEndian() != sys::IsLittleEndianHost)
4750 swapStruct(objc_ivar_list);
4751 outs() << "\t\t ivar_count " << objc_ivar_list.ivar_count << "\n";
4752 ivar_list = p + sizeof(struct objc_ivar_list_t);
4753 for (i = 0; i < objc_ivar_list.ivar_count; i++) {
4754 if ((i + 1) * sizeof(struct objc_ivar_t) > left) {
4755 outs() << "\t\t remaining ivar's extend past the of the section\n";
4758 memcpy(&ivar, ivar_list + i * sizeof(struct objc_ivar_t),
4759 sizeof(struct objc_ivar_t));
4760 if (info->O->isLittleEndian() != sys::IsLittleEndianHost)
4763 outs() << "\t\t\tivar_name " << format("0x%08" PRIx32, ivar.ivar_name);
4764 if (info->verbose) {
4765 name = get_pointer_32(ivar.ivar_name, offset, xleft, S, info, true);
4766 if (name != nullptr)
4767 outs() << format(" %.*s", xleft, name);
4769 outs() << " (not in an __OBJC section)";
4773 outs() << "\t\t\tivar_type " << format("0x%08" PRIx32, ivar.ivar_type);
4774 if (info->verbose) {
4775 name = get_pointer_32(ivar.ivar_type, offset, xleft, S, info, true);
4776 if (name != nullptr)
4777 outs() << format(" %.*s", xleft, name);
4779 outs() << " (not in an __OBJC section)";
4783 outs() << "\t\t ivar_offset "
4784 << format("0x%08" PRIx32, ivar.ivar_offset) << "\n";
4787 outs() << " (not in an __OBJC section)\n";
4790 outs() << "\t\t methods " << format("0x%08" PRIx32, objc_class->methodLists);
4791 if (print_method_list(objc_class->methodLists, info))
4792 outs() << " (not in an __OBJC section)\n";
4794 outs() << "\t\t cache " << format("0x%08" PRIx32, objc_class->cache)
4797 outs() << "\t\tprotocols " << format("0x%08" PRIx32, objc_class->protocols);
4798 if (print_protocol_list(objc_class->protocols, 16, info))
4799 outs() << " (not in an __OBJC section)\n";
4802 static void print_objc_objc_category_t(struct objc_category_t *objc_category,
4803 struct DisassembleInfo *info) {
4804 uint32_t offset, left;
4808 outs() << "\t category name "
4809 << format("0x%08" PRIx32, objc_category->category_name);
4810 if (info->verbose) {
4811 name = get_pointer_32(objc_category->category_name, offset, left, S, info,
4813 if (name != nullptr)
4814 outs() << format(" %.*s", left, name);
4816 outs() << " (not in an __OBJC section)";
4820 outs() << "\t\t class name "
4821 << format("0x%08" PRIx32, objc_category->class_name);
4822 if (info->verbose) {
4824 get_pointer_32(objc_category->class_name, offset, left, S, info, true);
4825 if (name != nullptr)
4826 outs() << format(" %.*s", left, name);
4828 outs() << " (not in an __OBJC section)";
4832 outs() << "\t instance methods "
4833 << format("0x%08" PRIx32, objc_category->instance_methods);
4834 if (print_method_list(objc_category->instance_methods, info))
4835 outs() << " (not in an __OBJC section)\n";
4837 outs() << "\t class methods "
4838 << format("0x%08" PRIx32, objc_category->class_methods);
4839 if (print_method_list(objc_category->class_methods, info))
4840 outs() << " (not in an __OBJC section)\n";
4843 static void print_category64_t(uint64_t p, struct DisassembleInfo *info) {
4844 struct category64_t c;
4846 uint32_t offset, xoffset, left;
4848 const char *name, *sym_name;
4851 r = get_pointer_64(p, offset, left, S, info);
4854 memset(&c, '\0', sizeof(struct category64_t));
4855 if (left < sizeof(struct category64_t)) {
4856 memcpy(&c, r, left);
4857 outs() << " (category_t entends past the end of the section)\n";
4859 memcpy(&c, r, sizeof(struct category64_t));
4860 if (info->O->isLittleEndian() != sys::IsLittleEndianHost)
4864 sym_name = get_symbol_64(offset + offsetof(struct category64_t, name), S,
4865 info, n_value, c.name);
4867 if (info->verbose && sym_name != nullptr)
4870 outs() << format("0x%" PRIx64, n_value);
4872 outs() << " + " << format("0x%" PRIx64, c.name);
4874 outs() << format("0x%" PRIx64, c.name);
4875 name = get_pointer_64(c.name + n_value, xoffset, left, xS, info);
4876 if (name != nullptr)
4877 outs() << format(" %.*s", left, name);
4881 sym_name = get_symbol_64(offset + offsetof(struct category64_t, cls), S, info,
4884 if (info->verbose && sym_name != nullptr)
4887 outs() << format("0x%" PRIx64, n_value);
4889 outs() << " + " << format("0x%" PRIx64, c.cls);
4891 outs() << format("0x%" PRIx64, c.cls);
4893 if (c.cls + n_value != 0)
4894 print_class64_t(c.cls + n_value, info);
4896 outs() << " instanceMethods ";
4898 get_symbol_64(offset + offsetof(struct category64_t, instanceMethods), S,
4899 info, n_value, c.instanceMethods);
4901 if (info->verbose && sym_name != nullptr)
4904 outs() << format("0x%" PRIx64, n_value);
4905 if (c.instanceMethods != 0)
4906 outs() << " + " << format("0x%" PRIx64, c.instanceMethods);
4908 outs() << format("0x%" PRIx64, c.instanceMethods);
4910 if (c.instanceMethods + n_value != 0)
4911 print_method_list64_t(c.instanceMethods + n_value, info, "");
4913 outs() << " classMethods ";
4914 sym_name = get_symbol_64(offset + offsetof(struct category64_t, classMethods),
4915 S, info, n_value, c.classMethods);
4917 if (info->verbose && sym_name != nullptr)
4920 outs() << format("0x%" PRIx64, n_value);
4921 if (c.classMethods != 0)
4922 outs() << " + " << format("0x%" PRIx64, c.classMethods);
4924 outs() << format("0x%" PRIx64, c.classMethods);
4926 if (c.classMethods + n_value != 0)
4927 print_method_list64_t(c.classMethods + n_value, info, "");
4929 outs() << " protocols ";
4930 sym_name = get_symbol_64(offset + offsetof(struct category64_t, protocols), S,
4931 info, n_value, c.protocols);
4933 if (info->verbose && sym_name != nullptr)
4936 outs() << format("0x%" PRIx64, n_value);
4937 if (c.protocols != 0)
4938 outs() << " + " << format("0x%" PRIx64, c.protocols);
4940 outs() << format("0x%" PRIx64, c.protocols);
4942 if (c.protocols + n_value != 0)
4943 print_protocol_list64_t(c.protocols + n_value, info);
4945 outs() << "instanceProperties ";
4947 get_symbol_64(offset + offsetof(struct category64_t, instanceProperties),
4948 S, info, n_value, c.instanceProperties);
4950 if (info->verbose && sym_name != nullptr)
4953 outs() << format("0x%" PRIx64, n_value);
4954 if (c.instanceProperties != 0)
4955 outs() << " + " << format("0x%" PRIx64, c.instanceProperties);
4957 outs() << format("0x%" PRIx64, c.instanceProperties);
4959 if (c.instanceProperties + n_value != 0)
4960 print_objc_property_list64(c.instanceProperties + n_value, info);
4963 static void print_category32_t(uint32_t p, struct DisassembleInfo *info) {
4964 struct category32_t c;
4966 uint32_t offset, left;
4970 r = get_pointer_32(p, offset, left, S, info);
4973 memset(&c, '\0', sizeof(struct category32_t));
4974 if (left < sizeof(struct category32_t)) {
4975 memcpy(&c, r, left);
4976 outs() << " (category_t entends past the end of the section)\n";
4978 memcpy(&c, r, sizeof(struct category32_t));
4979 if (info->O->isLittleEndian() != sys::IsLittleEndianHost)
4982 outs() << " name " << format("0x%" PRIx32, c.name);
4983 name = get_symbol_32(offset + offsetof(struct category32_t, name), S, info,
4986 outs() << " " << name;
4989 outs() << " cls " << format("0x%" PRIx32, c.cls) << "\n";
4991 print_class32_t(c.cls, info);
4992 outs() << " instanceMethods " << format("0x%" PRIx32, c.instanceMethods)
4994 if (c.instanceMethods != 0)
4995 print_method_list32_t(c.instanceMethods, info, "");
4996 outs() << " classMethods " << format("0x%" PRIx32, c.classMethods)
4998 if (c.classMethods != 0)
4999 print_method_list32_t(c.classMethods, info, "");
5000 outs() << " protocols " << format("0x%" PRIx32, c.protocols) << "\n";
5001 if (c.protocols != 0)
5002 print_protocol_list32_t(c.protocols, info);
5003 outs() << "instanceProperties " << format("0x%" PRIx32, c.instanceProperties)
5005 if (c.instanceProperties != 0)
5006 print_objc_property_list32(c.instanceProperties, info);
5009 static void print_message_refs64(SectionRef S, struct DisassembleInfo *info) {
5010 uint32_t i, left, offset, xoffset;
5011 uint64_t p, n_value;
5012 struct message_ref64 mr;
5013 const char *name, *sym_name;
5017 if (S == SectionRef())
5021 S.getName(SectName);
5022 DataRefImpl Ref = S.getRawDataRefImpl();
5023 StringRef SegName = info->O->getSectionFinalSegmentName(Ref);
5024 outs() << "Contents of (" << SegName << "," << SectName << ") section\n";
5026 for (i = 0; i < S.getSize(); i += sizeof(struct message_ref64)) {
5027 p = S.getAddress() + i;
5028 r = get_pointer_64(p, offset, left, S, info);
5031 memset(&mr, '\0', sizeof(struct message_ref64));
5032 if (left < sizeof(struct message_ref64)) {
5033 memcpy(&mr, r, left);
5034 outs() << " (message_ref entends past the end of the section)\n";
5036 memcpy(&mr, r, sizeof(struct message_ref64));
5037 if (info->O->isLittleEndian() != sys::IsLittleEndianHost)
5041 name = get_symbol_64(offset + offsetof(struct message_ref64, imp), S, info,
5044 outs() << format("0x%" PRIx64, n_value) << " ";
5046 outs() << "+ " << format("0x%" PRIx64, mr.imp) << " ";
5048 outs() << format("0x%" PRIx64, mr.imp) << " ";
5049 if (name != nullptr)
5050 outs() << " " << name;
5054 sym_name = get_symbol_64(offset + offsetof(struct message_ref64, sel), S,
5055 info, n_value, mr.sel);
5057 if (info->verbose && sym_name != nullptr)
5060 outs() << format("0x%" PRIx64, n_value);
5062 outs() << " + " << format("0x%" PRIx64, mr.sel);
5064 outs() << format("0x%" PRIx64, mr.sel);
5065 name = get_pointer_64(mr.sel + n_value, xoffset, left, xS, info);
5066 if (name != nullptr)
5067 outs() << format(" %.*s", left, name);
5070 offset += sizeof(struct message_ref64);
5074 static void print_message_refs32(SectionRef S, struct DisassembleInfo *info) {
5075 uint32_t i, left, offset, xoffset, p;
5076 struct message_ref32 mr;
5077 const char *name, *r;
5080 if (S == SectionRef())
5084 S.getName(SectName);
5085 DataRefImpl Ref = S.getRawDataRefImpl();
5086 StringRef SegName = info->O->getSectionFinalSegmentName(Ref);
5087 outs() << "Contents of (" << SegName << "," << SectName << ") section\n";
5089 for (i = 0; i < S.getSize(); i += sizeof(struct message_ref64)) {
5090 p = S.getAddress() + i;
5091 r = get_pointer_32(p, offset, left, S, info);
5094 memset(&mr, '\0', sizeof(struct message_ref32));
5095 if (left < sizeof(struct message_ref32)) {
5096 memcpy(&mr, r, left);
5097 outs() << " (message_ref entends past the end of the section)\n";
5099 memcpy(&mr, r, sizeof(struct message_ref32));
5100 if (info->O->isLittleEndian() != sys::IsLittleEndianHost)
5103 outs() << " imp " << format("0x%" PRIx32, mr.imp);
5104 name = get_symbol_32(offset + offsetof(struct message_ref32, imp), S, info,
5106 if (name != nullptr)
5107 outs() << " " << name;
5110 outs() << " sel " << format("0x%" PRIx32, mr.sel);
5111 name = get_pointer_32(mr.sel, xoffset, left, xS, info);
5112 if (name != nullptr)
5113 outs() << " " << name;
5116 offset += sizeof(struct message_ref32);
5120 static void print_image_info64(SectionRef S, struct DisassembleInfo *info) {
5121 uint32_t left, offset, swift_version;
5123 struct objc_image_info64 o;
5126 if (S == SectionRef())
5130 S.getName(SectName);
5131 DataRefImpl Ref = S.getRawDataRefImpl();
5132 StringRef SegName = info->O->getSectionFinalSegmentName(Ref);
5133 outs() << "Contents of (" << SegName << "," << SectName << ") section\n";
5135 r = get_pointer_64(p, offset, left, S, info);
5138 memset(&o, '\0', sizeof(struct objc_image_info64));
5139 if (left < sizeof(struct objc_image_info64)) {
5140 memcpy(&o, r, left);
5141 outs() << " (objc_image_info entends past the end of the section)\n";
5143 memcpy(&o, r, sizeof(struct objc_image_info64));
5144 if (info->O->isLittleEndian() != sys::IsLittleEndianHost)
5146 outs() << " version " << o.version << "\n";
5147 outs() << " flags " << format("0x%" PRIx32, o.flags);
5148 if (o.flags & OBJC_IMAGE_IS_REPLACEMENT)
5149 outs() << " OBJC_IMAGE_IS_REPLACEMENT";
5150 if (o.flags & OBJC_IMAGE_SUPPORTS_GC)
5151 outs() << " OBJC_IMAGE_SUPPORTS_GC";
5152 swift_version = (o.flags >> 8) & 0xff;
5153 if (swift_version != 0) {
5154 if (swift_version == 1)
5155 outs() << " Swift 1.0";
5156 else if (swift_version == 2)
5157 outs() << " Swift 1.1";
5159 outs() << " unknown future Swift version (" << swift_version << ")";
5164 static void print_image_info32(SectionRef S, struct DisassembleInfo *info) {
5165 uint32_t left, offset, swift_version, p;
5166 struct objc_image_info32 o;
5169 if (S == SectionRef())
5173 S.getName(SectName);
5174 DataRefImpl Ref = S.getRawDataRefImpl();
5175 StringRef SegName = info->O->getSectionFinalSegmentName(Ref);
5176 outs() << "Contents of (" << SegName << "," << SectName << ") section\n";
5178 r = get_pointer_32(p, offset, left, S, info);
5181 memset(&o, '\0', sizeof(struct objc_image_info32));
5182 if (left < sizeof(struct objc_image_info32)) {
5183 memcpy(&o, r, left);
5184 outs() << " (objc_image_info entends past the end of the section)\n";
5186 memcpy(&o, r, sizeof(struct objc_image_info32));
5187 if (info->O->isLittleEndian() != sys::IsLittleEndianHost)
5189 outs() << " version " << o.version << "\n";
5190 outs() << " flags " << format("0x%" PRIx32, o.flags);
5191 if (o.flags & OBJC_IMAGE_IS_REPLACEMENT)
5192 outs() << " OBJC_IMAGE_IS_REPLACEMENT";
5193 if (o.flags & OBJC_IMAGE_SUPPORTS_GC)
5194 outs() << " OBJC_IMAGE_SUPPORTS_GC";
5195 swift_version = (o.flags >> 8) & 0xff;
5196 if (swift_version != 0) {
5197 if (swift_version == 1)
5198 outs() << " Swift 1.0";
5199 else if (swift_version == 2)
5200 outs() << " Swift 1.1";
5202 outs() << " unknown future Swift version (" << swift_version << ")";
5207 static void print_image_info(SectionRef S, struct DisassembleInfo *info) {
5208 uint32_t left, offset, p;
5209 struct imageInfo_t o;
5213 S.getName(SectName);
5214 DataRefImpl Ref = S.getRawDataRefImpl();
5215 StringRef SegName = info->O->getSectionFinalSegmentName(Ref);
5216 outs() << "Contents of (" << SegName << "," << SectName << ") section\n";
5218 r = get_pointer_32(p, offset, left, S, info);
5221 memset(&o, '\0', sizeof(struct imageInfo_t));
5222 if (left < sizeof(struct imageInfo_t)) {
5223 memcpy(&o, r, left);
5224 outs() << " (imageInfo entends past the end of the section)\n";
5226 memcpy(&o, r, sizeof(struct imageInfo_t));
5227 if (info->O->isLittleEndian() != sys::IsLittleEndianHost)
5229 outs() << " version " << o.version << "\n";
5230 outs() << " flags " << format("0x%" PRIx32, o.flags);
5236 outs() << " GC-only";
5242 static void printObjc2_64bit_MetaData(MachOObjectFile *O, bool verbose) {
5243 SymbolAddressMap AddrMap;
5245 CreateSymbolAddressMap(O, &AddrMap);
5247 std::vector<SectionRef> Sections;
5248 for (const SectionRef &Section : O->sections()) {
5250 Section.getName(SectName);
5251 Sections.push_back(Section);
5254 struct DisassembleInfo info;
5255 // Set up the block of info used by the Symbolizer call backs.
5256 info.verbose = verbose;
5258 info.AddrMap = &AddrMap;
5259 info.Sections = &Sections;
5260 info.class_name = nullptr;
5261 info.selector_name = nullptr;
5262 info.method = nullptr;
5263 info.demangled_name = nullptr;
5264 info.bindtable = nullptr;
5269 SectionRef CL = get_section(O, "__OBJC2", "__class_list");
5270 if (CL == SectionRef())
5271 CL = get_section(O, "__DATA", "__objc_classlist");
5273 walk_pointer_list_64("class", CL, O, &info, print_class64_t);
5275 SectionRef CR = get_section(O, "__OBJC2", "__class_refs");
5276 if (CR == SectionRef())
5277 CR = get_section(O, "__DATA", "__objc_classrefs");
5279 walk_pointer_list_64("class refs", CR, O, &info, nullptr);
5281 SectionRef SR = get_section(O, "__OBJC2", "__super_refs");
5282 if (SR == SectionRef())
5283 SR = get_section(O, "__DATA", "__objc_superrefs");
5285 walk_pointer_list_64("super refs", SR, O, &info, nullptr);
5287 SectionRef CA = get_section(O, "__OBJC2", "__category_list");
5288 if (CA == SectionRef())
5289 CA = get_section(O, "__DATA", "__objc_catlist");
5291 walk_pointer_list_64("category", CA, O, &info, print_category64_t);
5293 SectionRef PL = get_section(O, "__OBJC2", "__protocol_list");
5294 if (PL == SectionRef())
5295 PL = get_section(O, "__DATA", "__objc_protolist");
5297 walk_pointer_list_64("protocol", PL, O, &info, nullptr);
5299 SectionRef MR = get_section(O, "__OBJC2", "__message_refs");
5300 if (MR == SectionRef())
5301 MR = get_section(O, "__DATA", "__objc_msgrefs");
5303 print_message_refs64(MR, &info);
5305 SectionRef II = get_section(O, "__OBJC2", "__image_info");
5306 if (II == SectionRef())
5307 II = get_section(O, "__DATA", "__objc_imageinfo");
5309 print_image_info64(II, &info);
5312 static void printObjc2_32bit_MetaData(MachOObjectFile *O, bool verbose) {
5313 SymbolAddressMap AddrMap;
5315 CreateSymbolAddressMap(O, &AddrMap);
5317 std::vector<SectionRef> Sections;
5318 for (const SectionRef &Section : O->sections()) {
5320 Section.getName(SectName);
5321 Sections.push_back(Section);
5324 struct DisassembleInfo info;
5325 // Set up the block of info used by the Symbolizer call backs.
5326 info.verbose = verbose;
5328 info.AddrMap = &AddrMap;
5329 info.Sections = &Sections;
5330 info.class_name = nullptr;
5331 info.selector_name = nullptr;
5332 info.method = nullptr;
5333 info.demangled_name = nullptr;
5334 info.bindtable = nullptr;
5338 const SectionRef CL = get_section(O, "__OBJC2", "__class_list");
5339 if (CL != SectionRef()) {
5341 walk_pointer_list_32("class", CL, O, &info, print_class32_t);
5343 const SectionRef CL = get_section(O, "__DATA", "__objc_classlist");
5345 walk_pointer_list_32("class", CL, O, &info, print_class32_t);
5348 const SectionRef CR = get_section(O, "__OBJC2", "__class_refs");
5349 if (CR != SectionRef()) {
5351 walk_pointer_list_32("class refs", CR, O, &info, nullptr);
5353 const SectionRef CR = get_section(O, "__DATA", "__objc_classrefs");
5355 walk_pointer_list_32("class refs", CR, O, &info, nullptr);
5358 const SectionRef SR = get_section(O, "__OBJC2", "__super_refs");
5359 if (SR != SectionRef()) {
5361 walk_pointer_list_32("super refs", SR, O, &info, nullptr);
5363 const SectionRef SR = get_section(O, "__DATA", "__objc_superrefs");
5365 walk_pointer_list_32("super refs", SR, O, &info, nullptr);
5368 const SectionRef CA = get_section(O, "__OBJC2", "__category_list");
5369 if (CA != SectionRef()) {
5371 walk_pointer_list_32("category", CA, O, &info, print_category32_t);
5373 const SectionRef CA = get_section(O, "__DATA", "__objc_catlist");
5375 walk_pointer_list_32("category", CA, O, &info, print_category32_t);
5378 const SectionRef PL = get_section(O, "__OBJC2", "__protocol_list");
5379 if (PL != SectionRef()) {
5381 walk_pointer_list_32("protocol", PL, O, &info, nullptr);
5383 const SectionRef PL = get_section(O, "__DATA", "__objc_protolist");
5385 walk_pointer_list_32("protocol", PL, O, &info, nullptr);
5388 const SectionRef MR = get_section(O, "__OBJC2", "__message_refs");
5389 if (MR != SectionRef()) {
5391 print_message_refs32(MR, &info);
5393 const SectionRef MR = get_section(O, "__DATA", "__objc_msgrefs");
5395 print_message_refs32(MR, &info);
5398 const SectionRef II = get_section(O, "__OBJC2", "__image_info");
5399 if (II != SectionRef()) {
5401 print_image_info32(II, &info);
5403 const SectionRef II = get_section(O, "__DATA", "__objc_imageinfo");
5405 print_image_info32(II, &info);
5409 static bool printObjc1_32bit_MetaData(MachOObjectFile *O, bool verbose) {
5410 uint32_t i, j, p, offset, xoffset, left, defs_left, def;
5411 const char *r, *name, *defs;
5412 struct objc_module_t module;
5414 struct objc_symtab_t symtab;
5415 struct objc_class_t objc_class;
5416 struct objc_category_t objc_category;
5418 outs() << "Objective-C segment\n";
5419 S = get_section(O, "__OBJC", "__module_info");
5420 if (S == SectionRef())
5423 SymbolAddressMap AddrMap;
5425 CreateSymbolAddressMap(O, &AddrMap);
5427 std::vector<SectionRef> Sections;
5428 for (const SectionRef &Section : O->sections()) {
5430 Section.getName(SectName);
5431 Sections.push_back(Section);
5434 struct DisassembleInfo info;
5435 // Set up the block of info used by the Symbolizer call backs.
5436 info.verbose = verbose;
5438 info.AddrMap = &AddrMap;
5439 info.Sections = &Sections;
5440 info.class_name = nullptr;
5441 info.selector_name = nullptr;
5442 info.method = nullptr;
5443 info.demangled_name = nullptr;
5444 info.bindtable = nullptr;
5448 for (i = 0; i < S.getSize(); i += sizeof(struct objc_module_t)) {
5449 p = S.getAddress() + i;
5450 r = get_pointer_32(p, offset, left, S, &info, true);
5453 memset(&module, '\0', sizeof(struct objc_module_t));
5454 if (left < sizeof(struct objc_module_t)) {
5455 memcpy(&module, r, left);
5456 outs() << " (module extends past end of __module_info section)\n";
5458 memcpy(&module, r, sizeof(struct objc_module_t));
5459 if (O->isLittleEndian() != sys::IsLittleEndianHost)
5462 outs() << "Module " << format("0x%" PRIx32, p) << "\n";
5463 outs() << " version " << module.version << "\n";
5464 outs() << " size " << module.size << "\n";
5466 name = get_pointer_32(module.name, xoffset, left, xS, &info, true);
5467 if (name != nullptr)
5468 outs() << format("%.*s", left, name);
5470 outs() << format("0x%08" PRIx32, module.name)
5471 << "(not in an __OBJC section)";
5474 r = get_pointer_32(module.symtab, xoffset, left, xS, &info, true);
5475 if (module.symtab == 0 || r == nullptr) {
5476 outs() << " symtab " << format("0x%08" PRIx32, module.symtab)
5477 << " (not in an __OBJC section)\n";
5480 outs() << " symtab " << format("0x%08" PRIx32, module.symtab) << "\n";
5481 memset(&symtab, '\0', sizeof(struct objc_symtab_t));
5484 if (left < sizeof(struct objc_symtab_t)) {
5485 memcpy(&symtab, r, left);
5486 outs() << "\tsymtab extends past end of an __OBJC section)\n";
5488 memcpy(&symtab, r, sizeof(struct objc_symtab_t));
5489 if (left > sizeof(struct objc_symtab_t)) {
5490 defs_left = left - sizeof(struct objc_symtab_t);
5491 defs = r + sizeof(struct objc_symtab_t);
5494 if (O->isLittleEndian() != sys::IsLittleEndianHost)
5497 outs() << "\tsel_ref_cnt " << symtab.sel_ref_cnt << "\n";
5498 r = get_pointer_32(symtab.refs, xoffset, left, xS, &info, true);
5499 outs() << "\trefs " << format("0x%08" PRIx32, symtab.refs);
5501 outs() << " (not in an __OBJC section)";
5503 outs() << "\tcls_def_cnt " << symtab.cls_def_cnt << "\n";
5504 outs() << "\tcat_def_cnt " << symtab.cat_def_cnt << "\n";
5505 if (symtab.cls_def_cnt > 0)
5506 outs() << "\tClass Definitions\n";
5507 for (j = 0; j < symtab.cls_def_cnt; j++) {
5508 if ((j + 1) * sizeof(uint32_t) > defs_left) {
5509 outs() << "\t(remaining class defs entries entends past the end of the "
5513 memcpy(&def, defs + j * sizeof(uint32_t), sizeof(uint32_t));
5514 if (O->isLittleEndian() != sys::IsLittleEndianHost)
5515 sys::swapByteOrder(def);
5517 r = get_pointer_32(def, xoffset, left, xS, &info, true);
5518 outs() << "\tdefs[" << j << "] " << format("0x%08" PRIx32, def);
5520 if (left > sizeof(struct objc_class_t)) {
5522 memcpy(&objc_class, r, sizeof(struct objc_class_t));
5524 outs() << " (entends past the end of the section)\n";
5525 memset(&objc_class, '\0', sizeof(struct objc_class_t));
5526 memcpy(&objc_class, r, left);
5528 if (O->isLittleEndian() != sys::IsLittleEndianHost)
5529 swapStruct(objc_class);
5530 print_objc_class_t(&objc_class, &info);
5532 outs() << "(not in an __OBJC section)\n";
5535 if (CLS_GETINFO(&objc_class, CLS_CLASS)) {
5536 outs() << "\tMeta Class";
5537 r = get_pointer_32(objc_class.isa, xoffset, left, xS, &info, true);
5539 if (left > sizeof(struct objc_class_t)) {
5541 memcpy(&objc_class, r, sizeof(struct objc_class_t));
5543 outs() << " (entends past the end of the section)\n";
5544 memset(&objc_class, '\0', sizeof(struct objc_class_t));
5545 memcpy(&objc_class, r, left);
5547 if (O->isLittleEndian() != sys::IsLittleEndianHost)
5548 swapStruct(objc_class);
5549 print_objc_class_t(&objc_class, &info);
5551 outs() << "(not in an __OBJC section)\n";
5555 if (symtab.cat_def_cnt > 0)
5556 outs() << "\tCategory Definitions\n";
5557 for (j = 0; j < symtab.cat_def_cnt; j++) {
5558 if ((j + symtab.cls_def_cnt + 1) * sizeof(uint32_t) > defs_left) {
5559 outs() << "\t(remaining category defs entries entends past the end of "
5560 << "the section)\n";
5563 memcpy(&def, defs + (j + symtab.cls_def_cnt) * sizeof(uint32_t),
5565 if (O->isLittleEndian() != sys::IsLittleEndianHost)
5566 sys::swapByteOrder(def);
5568 r = get_pointer_32(def, xoffset, left, xS, &info, true);
5569 outs() << "\tdefs[" << j + symtab.cls_def_cnt << "] "
5570 << format("0x%08" PRIx32, def);
5572 if (left > sizeof(struct objc_category_t)) {
5574 memcpy(&objc_category, r, sizeof(struct objc_category_t));
5576 outs() << " (entends past the end of the section)\n";
5577 memset(&objc_category, '\0', sizeof(struct objc_category_t));
5578 memcpy(&objc_category, r, left);
5580 if (O->isLittleEndian() != sys::IsLittleEndianHost)
5581 swapStruct(objc_category);
5582 print_objc_objc_category_t(&objc_category, &info);
5584 outs() << "(not in an __OBJC section)\n";
5588 const SectionRef II = get_section(O, "__OBJC", "__image_info");
5589 if (II != SectionRef())
5590 print_image_info(II, &info);
5595 static void DumpProtocolSection(MachOObjectFile *O, const char *sect,
5596 uint32_t size, uint32_t addr) {
5597 SymbolAddressMap AddrMap;
5598 CreateSymbolAddressMap(O, &AddrMap);
5600 std::vector<SectionRef> Sections;
5601 for (const SectionRef &Section : O->sections()) {
5603 Section.getName(SectName);
5604 Sections.push_back(Section);
5607 struct DisassembleInfo info;
5608 // Set up the block of info used by the Symbolizer call backs.
5609 info.verbose = true;
5611 info.AddrMap = &AddrMap;
5612 info.Sections = &Sections;
5613 info.class_name = nullptr;
5614 info.selector_name = nullptr;
5615 info.method = nullptr;
5616 info.demangled_name = nullptr;
5617 info.bindtable = nullptr;
5622 struct objc_protocol_t protocol;
5623 uint32_t left, paddr;
5624 for (p = sect; p < sect + size; p += sizeof(struct objc_protocol_t)) {
5625 memset(&protocol, '\0', sizeof(struct objc_protocol_t));
5626 left = size - (p - sect);
5627 if (left < sizeof(struct objc_protocol_t)) {
5628 outs() << "Protocol extends past end of __protocol section\n";
5629 memcpy(&protocol, p, left);
5631 memcpy(&protocol, p, sizeof(struct objc_protocol_t));
5632 if (O->isLittleEndian() != sys::IsLittleEndianHost)
5633 swapStruct(protocol);
5634 paddr = addr + (p - sect);
5635 outs() << "Protocol " << format("0x%" PRIx32, paddr);
5636 if (print_protocol(paddr, 0, &info))
5637 outs() << "(not in an __OBJC section)\n";
5642 inline void swapStruct(struct xar_header &xar) {
5643 sys::swapByteOrder(xar.magic);
5644 sys::swapByteOrder(xar.size);
5645 sys::swapByteOrder(xar.version);
5646 sys::swapByteOrder(xar.toc_length_compressed);
5647 sys::swapByteOrder(xar.toc_length_uncompressed);
5648 sys::swapByteOrder(xar.cksum_alg);
5651 static void PrintModeVerbose(uint32_t mode) {
5652 switch(mode & S_IFMT){
5676 /* owner permissions */
5687 else if(mode & S_IEXEC)
5692 /* group permissions */
5693 if(mode & (S_IREAD >> 3))
5697 if(mode & (S_IWRITE >> 3))
5703 else if(mode & (S_IEXEC >> 3))
5708 /* other permissions */
5709 if(mode & (S_IREAD >> 6))
5713 if(mode & (S_IWRITE >> 6))
5719 else if(mode & (S_IEXEC >> 6))
5725 static void PrintXarFilesSummary(const char *XarFilename, xar_t xar) {
5729 const char *key, *type, *mode, *user, *group, *size, *mtime, *name, *m;
5731 uint32_t mode_value;
5733 xi = xar_iter_new();
5735 errs() << "Can't obtain an xar iterator for xar archive "
5736 << XarFilename << "\n";
5740 // Go through the xar's files.
5741 for (xf = xar_file_first(xar, xi); xf; xf = xar_file_next(xi)) {
5742 xp = xar_iter_new();
5744 errs() << "Can't obtain an xar iterator for xar archive "
5745 << XarFilename << "\n";
5755 for(key = xar_prop_first(xf, xp); key; key = xar_prop_next(xp)){
5756 const char *val = nullptr;
5757 xar_prop_get(xf, key, &val);
5758 #if 0 // Useful for debugging.
5759 outs() << "key: " << key << " value: " << val << "\n";
5761 if(strcmp(key, "type") == 0)
5763 if(strcmp(key, "mode") == 0)
5765 if(strcmp(key, "user") == 0)
5767 if(strcmp(key, "group") == 0)
5769 if(strcmp(key, "data/size") == 0)
5771 if(strcmp(key, "mtime") == 0)
5773 if(strcmp(key, "name") == 0)
5776 if(mode != nullptr){
5777 mode_value = strtoul(mode, &endp, 8);
5779 outs() << "(mode: \"" << mode << "\" contains non-octal chars) ";
5780 if(strcmp(type, "file") == 0)
5781 mode_value |= S_IFREG;
5782 PrintModeVerbose(mode_value);
5786 outs() << format("%10s/", user);
5787 if(group != nullptr)
5788 outs() << format("%-10s ", group);
5790 outs() << format("%7s ", size);
5791 if(mtime != nullptr){
5792 for(m = mtime; *m != 'T' && *m != '\0'; m++)
5797 for( ; *m != 'Z' && *m != '\0'; m++)
5807 static void DumpBitcodeSection(MachOObjectFile *O, const char *sect,
5808 uint32_t size, bool verbose,
5809 bool PrintXarHeader, bool PrintXarFileHeaders,
5810 std::string XarMemberName) {
5811 if(size < sizeof(struct xar_header)) {
5812 outs() << "size of (__LLVM,__bundle) section too small (smaller than size "
5813 "of struct xar_header)\n";
5816 struct xar_header XarHeader;
5817 memcpy(&XarHeader, sect, sizeof(struct xar_header));
5818 if (sys::IsLittleEndianHost)
5819 swapStruct(XarHeader);
5820 if (PrintXarHeader) {
5821 if (!XarMemberName.empty())
5822 outs() << "In xar member " << XarMemberName << ": ";
5824 outs() << "For (__LLVM,__bundle) section: ";
5825 outs() << "xar header\n";
5826 if (XarHeader.magic == XAR_HEADER_MAGIC)
5827 outs() << " magic XAR_HEADER_MAGIC\n";
5830 << format_hex(XarHeader.magic, 10, true)
5831 << " (not XAR_HEADER_MAGIC)\n";
5832 outs() << " size " << XarHeader.size << "\n";
5833 outs() << " version " << XarHeader.version << "\n";
5834 outs() << " toc_length_compressed " << XarHeader.toc_length_compressed
5836 outs() << "toc_length_uncompressed " << XarHeader.toc_length_uncompressed
5838 outs() << " cksum_alg ";
5839 switch (XarHeader.cksum_alg) {
5840 case XAR_CKSUM_NONE:
5841 outs() << "XAR_CKSUM_NONE\n";
5843 case XAR_CKSUM_SHA1:
5844 outs() << "XAR_CKSUM_SHA1\n";
5847 outs() << "XAR_CKSUM_MD5\n";
5849 #ifdef XAR_CKSUM_SHA256
5850 case XAR_CKSUM_SHA256:
5851 outs() << "XAR_CKSUM_SHA256\n";
5854 #ifdef XAR_CKSUM_SHA512
5855 case XAR_CKSUM_SHA512:
5856 outs() << "XAR_CKSUM_SHA512\n";
5860 outs() << XarHeader.cksum_alg << "\n";
5864 SmallString<128> XarFilename;
5866 std::error_code XarEC =
5867 sys::fs::createTemporaryFile("llvm-objdump", "xar", FD, XarFilename);
5869 errs() << XarEC.message() << "\n";
5872 tool_output_file XarFile(XarFilename, FD);
5873 raw_fd_ostream &XarOut = XarFile.os();
5874 StringRef XarContents(sect, size);
5875 XarOut << XarContents;
5877 if (XarOut.has_error())
5880 xar_t xar = xar_open(XarFilename.c_str(), READ);
5882 errs() << "Can't create temporary xar archive " << XarFilename << "\n";
5886 SmallString<128> TocFilename;
5887 std::error_code TocEC =
5888 sys::fs::createTemporaryFile("llvm-objdump", "toc", TocFilename);
5890 errs() << TocEC.message() << "\n";
5893 xar_serialize(xar, TocFilename.c_str());
5895 if (PrintXarFileHeaders) {
5896 if (!XarMemberName.empty())
5897 outs() << "In xar member " << XarMemberName << ": ";
5899 outs() << "For (__LLVM,__bundle) section: ";
5900 outs() << "xar archive files:\n";
5901 PrintXarFilesSummary(XarFilename.c_str(), xar);
5904 ErrorOr<std::unique_ptr<MemoryBuffer>> FileOrErr =
5905 MemoryBuffer::getFileOrSTDIN(TocFilename.c_str());
5906 if (std::error_code EC = FileOrErr.getError()) {
5907 errs() << EC.message() << "\n";
5910 std::unique_ptr<MemoryBuffer> &Buffer = FileOrErr.get();
5912 if (!XarMemberName.empty())
5913 outs() << "In xar member " << XarMemberName << ": ";
5915 outs() << "For (__LLVM,__bundle) section: ";
5916 outs() << "xar table of contents:\n";
5917 outs() << Buffer->getBuffer() << "\n";
5919 // TODO: Go through the xar's files.
5920 xar_iter_t xi = xar_iter_new();
5922 errs() << "Can't obtain an xar iterator for xar archive "
5923 << XarFilename.c_str() << "\n";
5927 for(xar_file_t xf = xar_file_first(xar, xi); xf; xf = xar_file_next(xi)){
5930 const char *member_name, *member_type, *member_size_string;
5933 xp = xar_iter_new();
5935 errs() << "Can't obtain an xar iterator for xar archive "
5936 << XarFilename.c_str() << "\n";
5942 member_size_string = NULL;
5943 for(key = xar_prop_first(xf, xp); key; key = xar_prop_next(xp)){
5944 const char *val = nullptr;
5945 xar_prop_get(xf, key, &val);
5946 #if 0 // Useful for debugging.
5947 outs() << "key: " << key << " value: " << val << "\n";
5949 if(strcmp(key, "name") == 0)
5951 if(strcmp(key, "type") == 0)
5953 if(strcmp(key, "data/size") == 0)
5954 member_size_string = val;
5957 * If we find a file with a name, date/size and type properties
5958 * and with the type being "file" see if that is a xar file.
5960 if (member_name != NULL && member_type != NULL &&
5961 strcmp(member_type, "file") == 0 &&
5962 member_size_string != NULL){
5963 // Extract the file into a buffer.
5965 member_size = strtoul(member_size_string, &endptr, 10);
5966 if (*endptr == '\0' && member_size != 0) {
5967 char *buffer = (char *) ::operator new (member_size);
5968 if (xar_extract_tobuffersz(xar, xf, &buffer, &member_size) == 0) {
5969 #if 0 // Useful for debugging.
5970 outs() << "xar member: " << member_name << " extracted\n";
5972 // Set the XarMemberName we want to see printed in the header.
5973 std::string OldXarMemberName;
5974 // If XarMemberName is already set this is nested. So
5975 // save the old name and create the nested name.
5976 if (!XarMemberName.empty()) {
5977 OldXarMemberName = XarMemberName;
5979 (Twine("[") + XarMemberName + "]" + member_name).str();
5981 OldXarMemberName = "";
5982 XarMemberName = member_name;
5984 // See if this is could be a xar file (nested).
5985 if (member_size >= sizeof(struct xar_header)) {
5986 #if 0 // Useful for debugging.
5987 outs() << "could be a xar file: " << member_name << "\n";
5989 memcpy((char *)&XarHeader, buffer, sizeof(struct xar_header));
5990 if (sys::IsLittleEndianHost)
5991 swapStruct(XarHeader);
5992 if(XarHeader.magic == XAR_HEADER_MAGIC)
5993 DumpBitcodeSection(O, buffer, member_size, verbose,
5994 PrintXarHeader, PrintXarFileHeaders,
5997 XarMemberName = OldXarMemberName;
6006 #endif // defined(HAVE_LIBXAR)
6008 static void printObjcMetaData(MachOObjectFile *O, bool verbose) {
6010 printObjc2_64bit_MetaData(O, verbose);
6012 MachO::mach_header H;
6014 if (H.cputype == MachO::CPU_TYPE_ARM)
6015 printObjc2_32bit_MetaData(O, verbose);
6017 // This is the 32-bit non-arm cputype case. Which is normally
6018 // the first Objective-C ABI. But it may be the case of a
6019 // binary for the iOS simulator which is the second Objective-C
6020 // ABI. In that case printObjc1_32bit_MetaData() will determine that
6021 // and return false.
6022 if (!printObjc1_32bit_MetaData(O, verbose))
6023 printObjc2_32bit_MetaData(O, verbose);
6028 // GuessLiteralPointer returns a string which for the item in the Mach-O file
6029 // for the address passed in as ReferenceValue for printing as a comment with
6030 // the instruction and also returns the corresponding type of that item
6031 // indirectly through ReferenceType.
6033 // If ReferenceValue is an address of literal cstring then a pointer to the
6034 // cstring is returned and ReferenceType is set to
6035 // LLVMDisassembler_ReferenceType_Out_LitPool_CstrAddr .
6037 // If ReferenceValue is an address of an Objective-C CFString, Selector ref or
6038 // Class ref that name is returned and the ReferenceType is set accordingly.
6040 // Lastly, literals which are Symbol address in a literal pool are looked for
6041 // and if found the symbol name is returned and ReferenceType is set to
6042 // LLVMDisassembler_ReferenceType_Out_LitPool_SymAddr .
6044 // If there is no item in the Mach-O file for the address passed in as
6045 // ReferenceValue nullptr is returned and ReferenceType is unchanged.
6046 static const char *GuessLiteralPointer(uint64_t ReferenceValue,
6047 uint64_t ReferencePC,
6048 uint64_t *ReferenceType,
6049 struct DisassembleInfo *info) {
6050 // First see if there is an external relocation entry at the ReferencePC.
6051 if (info->O->getHeader().filetype == MachO::MH_OBJECT) {
6052 uint64_t sect_addr = info->S.getAddress();
6053 uint64_t sect_offset = ReferencePC - sect_addr;
6054 bool reloc_found = false;
6056 MachO::any_relocation_info RE;
6057 bool isExtern = false;
6059 for (const RelocationRef &Reloc : info->S.relocations()) {
6060 uint64_t RelocOffset = Reloc.getOffset();
6061 if (RelocOffset == sect_offset) {
6062 Rel = Reloc.getRawDataRefImpl();
6063 RE = info->O->getRelocation(Rel);
6064 if (info->O->isRelocationScattered(RE))
6066 isExtern = info->O->getPlainRelocationExternal(RE);
6068 symbol_iterator RelocSym = Reloc.getSymbol();
6075 // If there is an external relocation entry for a symbol in a section
6076 // then used that symbol's value for the value of the reference.
6077 if (reloc_found && isExtern) {
6078 if (info->O->getAnyRelocationPCRel(RE)) {
6079 unsigned Type = info->O->getAnyRelocationType(RE);
6080 if (Type == MachO::X86_64_RELOC_SIGNED) {
6081 ReferenceValue = Symbol.getValue();
6087 // Look for literals such as Objective-C CFStrings refs, Selector refs,
6088 // Message refs and Class refs.
6089 bool classref, selref, msgref, cfstring;
6090 uint64_t pointer_value = GuessPointerPointer(ReferenceValue, info, classref,
6091 selref, msgref, cfstring);
6092 if (classref && pointer_value == 0) {
6093 // Note the ReferenceValue is a pointer into the __objc_classrefs section.
6094 // And the pointer_value in that section is typically zero as it will be
6095 // set by dyld as part of the "bind information".
6096 const char *name = get_dyld_bind_info_symbolname(ReferenceValue, info);
6097 if (name != nullptr) {
6098 *ReferenceType = LLVMDisassembler_ReferenceType_Out_Objc_Class_Ref;
6099 const char *class_name = strrchr(name, '$');
6100 if (class_name != nullptr && class_name[1] == '_' &&
6101 class_name[2] != '\0') {
6102 info->class_name = class_name + 2;
6109 *ReferenceType = LLVMDisassembler_ReferenceType_Out_Objc_Class_Ref;
6111 get_objc2_64bit_class_name(pointer_value, ReferenceValue, info);
6112 if (name != nullptr)
6113 info->class_name = name;
6115 name = "bad class ref";
6120 *ReferenceType = LLVMDisassembler_ReferenceType_Out_Objc_CFString_Ref;
6121 const char *name = get_objc2_64bit_cfstring_name(ReferenceValue, info);
6125 if (selref && pointer_value == 0)
6126 pointer_value = get_objc2_64bit_selref(ReferenceValue, info);
6128 if (pointer_value != 0)
6129 ReferenceValue = pointer_value;
6131 const char *name = GuessCstringPointer(ReferenceValue, info);
6133 if (pointer_value != 0 && selref) {
6134 *ReferenceType = LLVMDisassembler_ReferenceType_Out_Objc_Selector_Ref;
6135 info->selector_name = name;
6136 } else if (pointer_value != 0 && msgref) {
6137 info->class_name = nullptr;
6138 *ReferenceType = LLVMDisassembler_ReferenceType_Out_Objc_Message_Ref;
6139 info->selector_name = name;
6141 *ReferenceType = LLVMDisassembler_ReferenceType_Out_LitPool_CstrAddr;
6145 // Lastly look for an indirect symbol with this ReferenceValue which is in
6146 // a literal pool. If found return that symbol name.
6147 name = GuessIndirectSymbol(ReferenceValue, info);
6149 *ReferenceType = LLVMDisassembler_ReferenceType_Out_LitPool_SymAddr;
6156 // SymbolizerSymbolLookUp is the symbol lookup function passed when creating
6157 // the Symbolizer. It looks up the ReferenceValue using the info passed via the
6158 // pointer to the struct DisassembleInfo that was passed when MCSymbolizer
6159 // is created and returns the symbol name that matches the ReferenceValue or
6160 // nullptr if none. The ReferenceType is passed in for the IN type of
6161 // reference the instruction is making from the values in defined in the header
6162 // "llvm-c/Disassembler.h". On return the ReferenceType can set to a specific
6163 // Out type and the ReferenceName will also be set which is added as a comment
6164 // to the disassembled instruction.
6166 // If the symbol name is a C++ mangled name then the demangled name is
6167 // returned through ReferenceName and ReferenceType is set to
6168 // LLVMDisassembler_ReferenceType_DeMangled_Name .
6170 // When this is called to get a symbol name for a branch target then the
6171 // ReferenceType will be LLVMDisassembler_ReferenceType_In_Branch and then
6172 // SymbolValue will be looked for in the indirect symbol table to determine if
6173 // it is an address for a symbol stub. If so then the symbol name for that
6174 // stub is returned indirectly through ReferenceName and then ReferenceType is
6175 // set to LLVMDisassembler_ReferenceType_Out_SymbolStub.
6177 // When this is called with an value loaded via a PC relative load then
6178 // ReferenceType will be LLVMDisassembler_ReferenceType_In_PCrel_Load then the
6179 // SymbolValue is checked to be an address of literal pointer, symbol pointer,
6180 // or an Objective-C meta data reference. If so the output ReferenceType is
6181 // set to correspond to that as well as setting the ReferenceName.
6182 static const char *SymbolizerSymbolLookUp(void *DisInfo,
6183 uint64_t ReferenceValue,
6184 uint64_t *ReferenceType,
6185 uint64_t ReferencePC,
6186 const char **ReferenceName) {
6187 struct DisassembleInfo *info = (struct DisassembleInfo *)DisInfo;
6188 // If no verbose symbolic information is wanted then just return nullptr.
6189 if (!info->verbose) {
6190 *ReferenceName = nullptr;
6191 *ReferenceType = LLVMDisassembler_ReferenceType_InOut_None;
6195 const char *SymbolName = GuessSymbolName(ReferenceValue, info->AddrMap);
6197 if (*ReferenceType == LLVMDisassembler_ReferenceType_In_Branch) {
6198 *ReferenceName = GuessIndirectSymbol(ReferenceValue, info);
6199 if (*ReferenceName != nullptr) {
6200 method_reference(info, ReferenceType, ReferenceName);
6201 if (*ReferenceType != LLVMDisassembler_ReferenceType_Out_Objc_Message)
6202 *ReferenceType = LLVMDisassembler_ReferenceType_Out_SymbolStub;
6203 } else if (SymbolName != nullptr && strncmp(SymbolName, "__Z", 3) == 0) {
6204 if (info->demangled_name != nullptr)
6205 free(info->demangled_name);
6207 info->demangled_name =
6208 itaniumDemangle(SymbolName + 1, nullptr, nullptr, &status);
6209 if (info->demangled_name != nullptr) {
6210 *ReferenceName = info->demangled_name;
6211 *ReferenceType = LLVMDisassembler_ReferenceType_DeMangled_Name;
6213 *ReferenceType = LLVMDisassembler_ReferenceType_InOut_None;
6215 *ReferenceType = LLVMDisassembler_ReferenceType_InOut_None;
6216 } else if (*ReferenceType == LLVMDisassembler_ReferenceType_In_PCrel_Load) {
6218 GuessLiteralPointer(ReferenceValue, ReferencePC, ReferenceType, info);
6220 method_reference(info, ReferenceType, ReferenceName);
6222 *ReferenceType = LLVMDisassembler_ReferenceType_InOut_None;
6223 // If this is arm64 and the reference is an adrp instruction save the
6224 // instruction, passed in ReferenceValue and the address of the instruction
6225 // for use later if we see and add immediate instruction.
6226 } else if (info->O->getArch() == Triple::aarch64 &&
6227 *ReferenceType == LLVMDisassembler_ReferenceType_In_ARM64_ADRP) {
6228 info->adrp_inst = ReferenceValue;
6229 info->adrp_addr = ReferencePC;
6230 SymbolName = nullptr;
6231 *ReferenceName = nullptr;
6232 *ReferenceType = LLVMDisassembler_ReferenceType_InOut_None;
6233 // If this is arm64 and reference is an add immediate instruction and we
6235 // seen an adrp instruction just before it and the adrp's Xd register
6237 // this add's Xn register reconstruct the value being referenced and look to
6238 // see if it is a literal pointer. Note the add immediate instruction is
6239 // passed in ReferenceValue.
6240 } else if (info->O->getArch() == Triple::aarch64 &&
6241 *ReferenceType == LLVMDisassembler_ReferenceType_In_ARM64_ADDXri &&
6242 ReferencePC - 4 == info->adrp_addr &&
6243 (info->adrp_inst & 0x9f000000) == 0x90000000 &&
6244 (info->adrp_inst & 0x1f) == ((ReferenceValue >> 5) & 0x1f)) {
6245 uint32_t addxri_inst;
6246 uint64_t adrp_imm, addxri_imm;
6249 ((info->adrp_inst & 0x00ffffe0) >> 3) | ((info->adrp_inst >> 29) & 0x3);
6250 if (info->adrp_inst & 0x0200000)
6251 adrp_imm |= 0xfffffffffc000000LL;
6253 addxri_inst = ReferenceValue;
6254 addxri_imm = (addxri_inst >> 10) & 0xfff;
6255 if (((addxri_inst >> 22) & 0x3) == 1)
6258 ReferenceValue = (info->adrp_addr & 0xfffffffffffff000LL) +
6259 (adrp_imm << 12) + addxri_imm;
6262 GuessLiteralPointer(ReferenceValue, ReferencePC, ReferenceType, info);
6263 if (*ReferenceName == nullptr)
6264 *ReferenceType = LLVMDisassembler_ReferenceType_InOut_None;
6265 // If this is arm64 and the reference is a load register instruction and we
6266 // have seen an adrp instruction just before it and the adrp's Xd register
6267 // matches this add's Xn register reconstruct the value being referenced and
6268 // look to see if it is a literal pointer. Note the load register
6269 // instruction is passed in ReferenceValue.
6270 } else if (info->O->getArch() == Triple::aarch64 &&
6271 *ReferenceType == LLVMDisassembler_ReferenceType_In_ARM64_LDRXui &&
6272 ReferencePC - 4 == info->adrp_addr &&
6273 (info->adrp_inst & 0x9f000000) == 0x90000000 &&
6274 (info->adrp_inst & 0x1f) == ((ReferenceValue >> 5) & 0x1f)) {
6275 uint32_t ldrxui_inst;
6276 uint64_t adrp_imm, ldrxui_imm;
6279 ((info->adrp_inst & 0x00ffffe0) >> 3) | ((info->adrp_inst >> 29) & 0x3);
6280 if (info->adrp_inst & 0x0200000)
6281 adrp_imm |= 0xfffffffffc000000LL;
6283 ldrxui_inst = ReferenceValue;
6284 ldrxui_imm = (ldrxui_inst >> 10) & 0xfff;
6286 ReferenceValue = (info->adrp_addr & 0xfffffffffffff000LL) +
6287 (adrp_imm << 12) + (ldrxui_imm << 3);
6290 GuessLiteralPointer(ReferenceValue, ReferencePC, ReferenceType, info);
6291 if (*ReferenceName == nullptr)
6292 *ReferenceType = LLVMDisassembler_ReferenceType_InOut_None;
6294 // If this arm64 and is an load register (PC-relative) instruction the
6295 // ReferenceValue is the PC plus the immediate value.
6296 else if (info->O->getArch() == Triple::aarch64 &&
6297 (*ReferenceType == LLVMDisassembler_ReferenceType_In_ARM64_LDRXl ||
6298 *ReferenceType == LLVMDisassembler_ReferenceType_In_ARM64_ADR)) {
6300 GuessLiteralPointer(ReferenceValue, ReferencePC, ReferenceType, info);
6301 if (*ReferenceName == nullptr)
6302 *ReferenceType = LLVMDisassembler_ReferenceType_InOut_None;
6303 } else if (SymbolName != nullptr && strncmp(SymbolName, "__Z", 3) == 0) {
6304 if (info->demangled_name != nullptr)
6305 free(info->demangled_name);
6307 info->demangled_name =
6308 itaniumDemangle(SymbolName + 1, nullptr, nullptr, &status);
6309 if (info->demangled_name != nullptr) {
6310 *ReferenceName = info->demangled_name;
6311 *ReferenceType = LLVMDisassembler_ReferenceType_DeMangled_Name;
6315 *ReferenceName = nullptr;
6316 *ReferenceType = LLVMDisassembler_ReferenceType_InOut_None;
6322 /// \brief Emits the comments that are stored in the CommentStream.
6323 /// Each comment in the CommentStream must end with a newline.
6324 static void emitComments(raw_svector_ostream &CommentStream,
6325 SmallString<128> &CommentsToEmit,
6326 formatted_raw_ostream &FormattedOS,
6327 const MCAsmInfo &MAI) {
6328 // Flush the stream before taking its content.
6329 StringRef Comments = CommentsToEmit.str();
6330 // Get the default information for printing a comment.
6331 StringRef CommentBegin = MAI.getCommentString();
6332 unsigned CommentColumn = MAI.getCommentColumn();
6333 bool IsFirst = true;
6334 while (!Comments.empty()) {
6336 FormattedOS << '\n';
6337 // Emit a line of comments.
6338 FormattedOS.PadToColumn(CommentColumn);
6339 size_t Position = Comments.find('\n');
6340 FormattedOS << CommentBegin << ' ' << Comments.substr(0, Position);
6341 // Move after the newline character.
6342 Comments = Comments.substr(Position + 1);
6345 FormattedOS.flush();
6347 // Tell the comment stream that the vector changed underneath it.
6348 CommentsToEmit.clear();
6351 static void DisassembleMachO(StringRef Filename, MachOObjectFile *MachOOF,
6352 StringRef DisSegName, StringRef DisSectName) {
6353 const char *McpuDefault = nullptr;
6354 const Target *ThumbTarget = nullptr;
6355 const Target *TheTarget = GetTarget(MachOOF, &McpuDefault, &ThumbTarget);
6357 // GetTarget prints out stuff.
6360 if (MCPU.empty() && McpuDefault)
6363 std::unique_ptr<const MCInstrInfo> InstrInfo(TheTarget->createMCInstrInfo());
6364 std::unique_ptr<const MCInstrInfo> ThumbInstrInfo;
6366 ThumbInstrInfo.reset(ThumbTarget->createMCInstrInfo());
6368 // Package up features to be passed to target/subtarget
6369 std::string FeaturesStr;
6370 if (MAttrs.size()) {
6371 SubtargetFeatures Features;
6372 for (unsigned i = 0; i != MAttrs.size(); ++i)
6373 Features.AddFeature(MAttrs[i]);
6374 FeaturesStr = Features.getString();
6377 // Set up disassembler.
6378 std::unique_ptr<const MCRegisterInfo> MRI(
6379 TheTarget->createMCRegInfo(TripleName));
6380 std::unique_ptr<const MCAsmInfo> AsmInfo(
6381 TheTarget->createMCAsmInfo(*MRI, TripleName));
6382 std::unique_ptr<const MCSubtargetInfo> STI(
6383 TheTarget->createMCSubtargetInfo(TripleName, MCPU, FeaturesStr));
6384 MCContext Ctx(AsmInfo.get(), MRI.get(), nullptr);
6385 std::unique_ptr<MCDisassembler> DisAsm(
6386 TheTarget->createMCDisassembler(*STI, Ctx));
6387 std::unique_ptr<MCSymbolizer> Symbolizer;
6388 struct DisassembleInfo SymbolizerInfo;
6389 std::unique_ptr<MCRelocationInfo> RelInfo(
6390 TheTarget->createMCRelocationInfo(TripleName, Ctx));
6392 Symbolizer.reset(TheTarget->createMCSymbolizer(
6393 TripleName, SymbolizerGetOpInfo, SymbolizerSymbolLookUp,
6394 &SymbolizerInfo, &Ctx, std::move(RelInfo)));
6395 DisAsm->setSymbolizer(std::move(Symbolizer));
6397 int AsmPrinterVariant = AsmInfo->getAssemblerDialect();
6398 std::unique_ptr<MCInstPrinter> IP(TheTarget->createMCInstPrinter(
6399 Triple(TripleName), AsmPrinterVariant, *AsmInfo, *InstrInfo, *MRI));
6400 // Set the display preference for hex vs. decimal immediates.
6401 IP->setPrintImmHex(PrintImmHex);
6402 // Comment stream and backing vector.
6403 SmallString<128> CommentsToEmit;
6404 raw_svector_ostream CommentStream(CommentsToEmit);
6405 // FIXME: Setting the CommentStream in the InstPrinter is problematic in that
6406 // if it is done then arm64 comments for string literals don't get printed
6407 // and some constant get printed instead and not setting it causes intel
6408 // (32-bit and 64-bit) comments printed with different spacing before the
6409 // comment causing different diffs with the 'C' disassembler library API.
6410 // IP->setCommentStream(CommentStream);
6412 if (!AsmInfo || !STI || !DisAsm || !IP) {
6413 errs() << "error: couldn't initialize disassembler for target "
6414 << TripleName << '\n';
6418 // Set up separate thumb disassembler if needed.
6419 std::unique_ptr<const MCRegisterInfo> ThumbMRI;
6420 std::unique_ptr<const MCAsmInfo> ThumbAsmInfo;
6421 std::unique_ptr<const MCSubtargetInfo> ThumbSTI;
6422 std::unique_ptr<MCDisassembler> ThumbDisAsm;
6423 std::unique_ptr<MCInstPrinter> ThumbIP;
6424 std::unique_ptr<MCContext> ThumbCtx;
6425 std::unique_ptr<MCSymbolizer> ThumbSymbolizer;
6426 struct DisassembleInfo ThumbSymbolizerInfo;
6427 std::unique_ptr<MCRelocationInfo> ThumbRelInfo;
6429 ThumbMRI.reset(ThumbTarget->createMCRegInfo(ThumbTripleName));
6431 ThumbTarget->createMCAsmInfo(*ThumbMRI, ThumbTripleName));
6433 ThumbTarget->createMCSubtargetInfo(ThumbTripleName, MCPU, FeaturesStr));
6434 ThumbCtx.reset(new MCContext(ThumbAsmInfo.get(), ThumbMRI.get(), nullptr));
6435 ThumbDisAsm.reset(ThumbTarget->createMCDisassembler(*ThumbSTI, *ThumbCtx));
6436 MCContext *PtrThumbCtx = ThumbCtx.get();
6438 ThumbTarget->createMCRelocationInfo(ThumbTripleName, *PtrThumbCtx));
6440 ThumbSymbolizer.reset(ThumbTarget->createMCSymbolizer(
6441 ThumbTripleName, SymbolizerGetOpInfo, SymbolizerSymbolLookUp,
6442 &ThumbSymbolizerInfo, PtrThumbCtx, std::move(ThumbRelInfo)));
6443 ThumbDisAsm->setSymbolizer(std::move(ThumbSymbolizer));
6445 int ThumbAsmPrinterVariant = ThumbAsmInfo->getAssemblerDialect();
6446 ThumbIP.reset(ThumbTarget->createMCInstPrinter(
6447 Triple(ThumbTripleName), ThumbAsmPrinterVariant, *ThumbAsmInfo,
6448 *ThumbInstrInfo, *ThumbMRI));
6449 // Set the display preference for hex vs. decimal immediates.
6450 ThumbIP->setPrintImmHex(PrintImmHex);
6453 if (ThumbTarget && (!ThumbAsmInfo || !ThumbSTI || !ThumbDisAsm || !ThumbIP)) {
6454 errs() << "error: couldn't initialize disassembler for target "
6455 << ThumbTripleName << '\n';
6459 MachO::mach_header Header = MachOOF->getHeader();
6461 // FIXME: Using the -cfg command line option, this code used to be able to
6462 // annotate relocations with the referenced symbol's name, and if this was
6463 // inside a __[cf]string section, the data it points to. This is now replaced
6464 // by the upcoming MCSymbolizer, which needs the appropriate setup done above.
6465 std::vector<SectionRef> Sections;
6466 std::vector<SymbolRef> Symbols;
6467 SmallVector<uint64_t, 8> FoundFns;
6468 uint64_t BaseSegmentAddress;
6470 getSectionsAndSymbols(MachOOF, Sections, Symbols, FoundFns,
6471 BaseSegmentAddress);
6473 // Sort the symbols by address, just in case they didn't come in that way.
6474 std::sort(Symbols.begin(), Symbols.end(), SymbolSorter());
6476 // Build a data in code table that is sorted on by the address of each entry.
6477 uint64_t BaseAddress = 0;
6478 if (Header.filetype == MachO::MH_OBJECT)
6479 BaseAddress = Sections[0].getAddress();
6481 BaseAddress = BaseSegmentAddress;
6483 for (dice_iterator DI = MachOOF->begin_dices(), DE = MachOOF->end_dices();
6486 DI->getOffset(Offset);
6487 Dices.push_back(std::make_pair(BaseAddress + Offset, *DI));
6489 array_pod_sort(Dices.begin(), Dices.end());
6492 raw_ostream &DebugOut = DebugFlag ? dbgs() : nulls();
6494 raw_ostream &DebugOut = nulls();
6497 std::unique_ptr<DIContext> diContext;
6498 ObjectFile *DbgObj = MachOOF;
6499 // Try to find debug info and set up the DIContext for it.
6501 // A separate DSym file path was specified, parse it as a macho file,
6502 // get the sections and supply it to the section name parsing machinery.
6503 if (!DSYMFile.empty()) {
6504 ErrorOr<std::unique_ptr<MemoryBuffer>> BufOrErr =
6505 MemoryBuffer::getFileOrSTDIN(DSYMFile);
6506 if (std::error_code EC = BufOrErr.getError()) {
6507 errs() << "llvm-objdump: " << Filename << ": " << EC.message() << '\n';
6511 ObjectFile::createMachOObjectFile(BufOrErr.get()->getMemBufferRef())
6516 // Setup the DIContext
6517 diContext.reset(new DWARFContextInMemory(*DbgObj));
6520 if (FilterSections.size() == 0)
6521 outs() << "(" << DisSegName << "," << DisSectName << ") section\n";
6523 for (unsigned SectIdx = 0; SectIdx != Sections.size(); SectIdx++) {
6525 if (Sections[SectIdx].getName(SectName) || SectName != DisSectName)
6528 DataRefImpl DR = Sections[SectIdx].getRawDataRefImpl();
6530 StringRef SegmentName = MachOOF->getSectionFinalSegmentName(DR);
6531 if (SegmentName != DisSegName)
6535 Sections[SectIdx].getContents(BytesStr);
6536 ArrayRef<uint8_t> Bytes(reinterpret_cast<const uint8_t *>(BytesStr.data()),
6538 uint64_t SectAddress = Sections[SectIdx].getAddress();
6540 bool symbolTableWorked = false;
6542 // Create a map of symbol addresses to symbol names for use by
6543 // the SymbolizerSymbolLookUp() routine.
6544 SymbolAddressMap AddrMap;
6545 bool DisSymNameFound = false;
6546 for (const SymbolRef &Symbol : MachOOF->symbols()) {
6547 Expected<SymbolRef::Type> STOrErr = Symbol.getType();
6549 report_error(MachOOF->getFileName(), STOrErr.takeError());
6550 SymbolRef::Type ST = *STOrErr;
6551 if (ST == SymbolRef::ST_Function || ST == SymbolRef::ST_Data ||
6552 ST == SymbolRef::ST_Other) {
6553 uint64_t Address = Symbol.getValue();
6554 Expected<StringRef> SymNameOrErr = Symbol.getName();
6556 report_error(MachOOF->getFileName(), SymNameOrErr.takeError());
6557 StringRef SymName = *SymNameOrErr;
6558 AddrMap[Address] = SymName;
6559 if (!DisSymName.empty() && DisSymName == SymName)
6560 DisSymNameFound = true;
6563 if (!DisSymName.empty() && !DisSymNameFound) {
6564 outs() << "Can't find -dis-symname: " << DisSymName << "\n";
6567 // Set up the block of info used by the Symbolizer call backs.
6568 SymbolizerInfo.verbose = !NoSymbolicOperands;
6569 SymbolizerInfo.O = MachOOF;
6570 SymbolizerInfo.S = Sections[SectIdx];
6571 SymbolizerInfo.AddrMap = &AddrMap;
6572 SymbolizerInfo.Sections = &Sections;
6573 SymbolizerInfo.class_name = nullptr;
6574 SymbolizerInfo.selector_name = nullptr;
6575 SymbolizerInfo.method = nullptr;
6576 SymbolizerInfo.demangled_name = nullptr;
6577 SymbolizerInfo.bindtable = nullptr;
6578 SymbolizerInfo.adrp_addr = 0;
6579 SymbolizerInfo.adrp_inst = 0;
6580 // Same for the ThumbSymbolizer
6581 ThumbSymbolizerInfo.verbose = !NoSymbolicOperands;
6582 ThumbSymbolizerInfo.O = MachOOF;
6583 ThumbSymbolizerInfo.S = Sections[SectIdx];
6584 ThumbSymbolizerInfo.AddrMap = &AddrMap;
6585 ThumbSymbolizerInfo.Sections = &Sections;
6586 ThumbSymbolizerInfo.class_name = nullptr;
6587 ThumbSymbolizerInfo.selector_name = nullptr;
6588 ThumbSymbolizerInfo.method = nullptr;
6589 ThumbSymbolizerInfo.demangled_name = nullptr;
6590 ThumbSymbolizerInfo.bindtable = nullptr;
6591 ThumbSymbolizerInfo.adrp_addr = 0;
6592 ThumbSymbolizerInfo.adrp_inst = 0;
6594 unsigned int Arch = MachOOF->getArch();
6596 // Skip all symbols if this is a stubs file.
6597 if (Bytes.size() == 0)
6600 // Disassemble symbol by symbol.
6601 for (unsigned SymIdx = 0; SymIdx != Symbols.size(); SymIdx++) {
6602 Expected<StringRef> SymNameOrErr = Symbols[SymIdx].getName();
6604 report_error(MachOOF->getFileName(), SymNameOrErr.takeError());
6605 StringRef SymName = *SymNameOrErr;
6607 Expected<SymbolRef::Type> STOrErr = Symbols[SymIdx].getType();
6609 report_error(MachOOF->getFileName(), STOrErr.takeError());
6610 SymbolRef::Type ST = *STOrErr;
6611 if (ST != SymbolRef::ST_Function && ST != SymbolRef::ST_Data)
6614 // Make sure the symbol is defined in this section.
6615 bool containsSym = Sections[SectIdx].containsSymbol(Symbols[SymIdx]);
6617 if (!DisSymName.empty() && DisSymName == SymName) {
6618 outs() << "-dis-symname: " << DisSymName << " not in the section\n";
6623 // The __mh_execute_header is special and we need to deal with that fact
6624 // this symbol is before the start of the (__TEXT,__text) section and at the
6625 // address of the start of the __TEXT segment. This is because this symbol
6626 // is an N_SECT symbol in the (__TEXT,__text) but its address is before the
6627 // start of the section in a standard MH_EXECUTE filetype.
6628 if (!DisSymName.empty() && DisSymName == "__mh_execute_header") {
6629 outs() << "-dis-symname: __mh_execute_header not in any section\n";
6632 // When this code is trying to disassemble a symbol at a time and in the
6633 // case there is only the __mh_execute_header symbol left as in a stripped
6634 // executable, we need to deal with this by ignoring this symbol so the
6635 // whole section is disassembled and this symbol is then not displayed.
6636 if (SymName == "__mh_execute_header" || SymName == "__mh_dylib_header" ||
6637 SymName == "__mh_bundle_header" || SymName == "__mh_object_header" ||
6638 SymName == "__mh_preload_header" || SymName == "__mh_dylinker_header")
6641 // If we are only disassembling one symbol see if this is that symbol.
6642 if (!DisSymName.empty() && DisSymName != SymName)
6645 // Start at the address of the symbol relative to the section's address.
6646 uint64_t SectSize = Sections[SectIdx].getSize();
6647 uint64_t Start = Symbols[SymIdx].getValue();
6648 uint64_t SectionAddress = Sections[SectIdx].getAddress();
6649 Start -= SectionAddress;
6651 if (Start > SectSize) {
6652 outs() << "section data ends, " << SymName
6653 << " lies outside valid range\n";
6657 // Stop disassembling either at the beginning of the next symbol or at
6658 // the end of the section.
6659 bool containsNextSym = false;
6660 uint64_t NextSym = 0;
6661 uint64_t NextSymIdx = SymIdx + 1;
6662 while (Symbols.size() > NextSymIdx) {
6663 Expected<SymbolRef::Type> STOrErr = Symbols[NextSymIdx].getType();
6665 report_error(MachOOF->getFileName(), STOrErr.takeError());
6666 SymbolRef::Type NextSymType = *STOrErr;
6667 if (NextSymType == SymbolRef::ST_Function) {
6669 Sections[SectIdx].containsSymbol(Symbols[NextSymIdx]);
6670 NextSym = Symbols[NextSymIdx].getValue();
6671 NextSym -= SectionAddress;
6677 uint64_t End = containsNextSym ? std::min(NextSym, SectSize) : SectSize;
6680 symbolTableWorked = true;
6682 DataRefImpl Symb = Symbols[SymIdx].getRawDataRefImpl();
6683 bool IsThumb = MachOOF->getSymbolFlags(Symb) & SymbolRef::SF_Thumb;
6685 // We only need the dedicated Thumb target if there's a real choice
6686 // (i.e. we're not targeting M-class) and the function is Thumb.
6687 bool UseThumbTarget = IsThumb && ThumbTarget;
6689 outs() << SymName << ":\n";
6690 DILineInfo lastLine;
6691 for (uint64_t Index = Start; Index < End; Index += Size) {
6694 uint64_t PC = SectAddress + Index;
6695 if (!NoLeadingAddr) {
6696 if (FullLeadingAddr) {
6697 if (MachOOF->is64Bit())
6698 outs() << format("%016" PRIx64, PC);
6700 outs() << format("%08" PRIx64, PC);
6702 outs() << format("%8" PRIx64 ":", PC);
6705 if (!NoShowRawInsn || Arch == Triple::arm)
6708 // Check the data in code table here to see if this is data not an
6709 // instruction to be disassembled.
6711 Dice.push_back(std::make_pair(PC, DiceRef()));
6712 dice_table_iterator DTI =
6713 std::search(Dices.begin(), Dices.end(), Dice.begin(), Dice.end(),
6714 compareDiceTableEntries);
6715 if (DTI != Dices.end()) {
6717 DTI->second.getLength(Length);
6719 DTI->second.getKind(Kind);
6720 Size = DumpDataInCode(Bytes.data() + Index, Length, Kind);
6721 if ((Kind == MachO::DICE_KIND_JUMP_TABLE8) &&
6722 (PC == (DTI->first + Length - 1)) && (Length & 1))
6727 SmallVector<char, 64> AnnotationsBytes;
6728 raw_svector_ostream Annotations(AnnotationsBytes);
6732 gotInst = ThumbDisAsm->getInstruction(Inst, Size, Bytes.slice(Index),
6733 PC, DebugOut, Annotations);
6735 gotInst = DisAsm->getInstruction(Inst, Size, Bytes.slice(Index), PC,
6736 DebugOut, Annotations);
6738 if (!NoShowRawInsn || Arch == Triple::arm) {
6739 dumpBytes(makeArrayRef(Bytes.data() + Index, Size), outs());
6741 formatted_raw_ostream FormattedOS(outs());
6742 StringRef AnnotationsStr = Annotations.str();
6744 ThumbIP->printInst(&Inst, FormattedOS, AnnotationsStr, *ThumbSTI);
6746 IP->printInst(&Inst, FormattedOS, AnnotationsStr, *STI);
6747 emitComments(CommentStream, CommentsToEmit, FormattedOS, *AsmInfo);
6749 // Print debug info.
6751 DILineInfo dli = diContext->getLineInfoForAddress(PC);
6752 // Print valid line info if it changed.
6753 if (dli != lastLine && dli.Line != 0)
6754 outs() << "\t## " << dli.FileName << ':' << dli.Line << ':'
6760 unsigned int Arch = MachOOF->getArch();
6761 if (Arch == Triple::x86_64 || Arch == Triple::x86) {
6762 outs() << format("\t.byte 0x%02x #bad opcode\n",
6763 *(Bytes.data() + Index) & 0xff);
6764 Size = 1; // skip exactly one illegible byte and move on.
6765 } else if (Arch == Triple::aarch64 ||
6766 (Arch == Triple::arm && !IsThumb)) {
6767 uint32_t opcode = (*(Bytes.data() + Index) & 0xff) |
6768 (*(Bytes.data() + Index + 1) & 0xff) << 8 |
6769 (*(Bytes.data() + Index + 2) & 0xff) << 16 |
6770 (*(Bytes.data() + Index + 3) & 0xff) << 24;
6771 outs() << format("\t.long\t0x%08x\n", opcode);
6773 } else if (Arch == Triple::arm) {
6774 assert(IsThumb && "ARM mode should have been dealt with above");
6775 uint32_t opcode = (*(Bytes.data() + Index) & 0xff) |
6776 (*(Bytes.data() + Index + 1) & 0xff) << 8;
6777 outs() << format("\t.short\t0x%04x\n", opcode);
6780 errs() << "llvm-objdump: warning: invalid instruction encoding\n";
6782 Size = 1; // skip illegible bytes
6787 if (!symbolTableWorked) {
6788 // Reading the symbol table didn't work, disassemble the whole section.
6789 uint64_t SectAddress = Sections[SectIdx].getAddress();
6790 uint64_t SectSize = Sections[SectIdx].getSize();
6792 for (uint64_t Index = 0; Index < SectSize; Index += InstSize) {
6795 uint64_t PC = SectAddress + Index;
6796 if (DisAsm->getInstruction(Inst, InstSize, Bytes.slice(Index), PC,
6797 DebugOut, nulls())) {
6798 if (!NoLeadingAddr) {
6799 if (FullLeadingAddr) {
6800 if (MachOOF->is64Bit())
6801 outs() << format("%016" PRIx64, PC);
6803 outs() << format("%08" PRIx64, PC);
6805 outs() << format("%8" PRIx64 ":", PC);
6808 if (!NoShowRawInsn || Arch == Triple::arm) {
6810 dumpBytes(makeArrayRef(Bytes.data() + Index, InstSize), outs());
6812 IP->printInst(&Inst, outs(), "", *STI);
6815 unsigned int Arch = MachOOF->getArch();
6816 if (Arch == Triple::x86_64 || Arch == Triple::x86) {
6817 outs() << format("\t.byte 0x%02x #bad opcode\n",
6818 *(Bytes.data() + Index) & 0xff);
6819 InstSize = 1; // skip exactly one illegible byte and move on.
6821 errs() << "llvm-objdump: warning: invalid instruction encoding\n";
6823 InstSize = 1; // skip illegible bytes
6828 // The TripleName's need to be reset if we are called again for a different
6831 ThumbTripleName = "";
6833 if (SymbolizerInfo.method != nullptr)
6834 free(SymbolizerInfo.method);
6835 if (SymbolizerInfo.demangled_name != nullptr)
6836 free(SymbolizerInfo.demangled_name);
6837 if (ThumbSymbolizerInfo.method != nullptr)
6838 free(ThumbSymbolizerInfo.method);
6839 if (ThumbSymbolizerInfo.demangled_name != nullptr)
6840 free(ThumbSymbolizerInfo.demangled_name);
6844 //===----------------------------------------------------------------------===//
6845 // __compact_unwind section dumping
6846 //===----------------------------------------------------------------------===//
6850 template <typename T> static uint64_t readNext(const char *&Buf) {
6851 using llvm::support::little;
6852 using llvm::support::unaligned;
6854 uint64_t Val = support::endian::read<T, little, unaligned>(Buf);
6859 struct CompactUnwindEntry {
6860 uint32_t OffsetInSection;
6862 uint64_t FunctionAddr;
6864 uint32_t CompactEncoding;
6865 uint64_t PersonalityAddr;
6868 RelocationRef FunctionReloc;
6869 RelocationRef PersonalityReloc;
6870 RelocationRef LSDAReloc;
6872 CompactUnwindEntry(StringRef Contents, unsigned Offset, bool Is64)
6873 : OffsetInSection(Offset) {
6875 read<uint64_t>(Contents.data() + Offset);
6877 read<uint32_t>(Contents.data() + Offset);
6881 template <typename UIntPtr> void read(const char *Buf) {
6882 FunctionAddr = readNext<UIntPtr>(Buf);
6883 Length = readNext<uint32_t>(Buf);
6884 CompactEncoding = readNext<uint32_t>(Buf);
6885 PersonalityAddr = readNext<UIntPtr>(Buf);
6886 LSDAAddr = readNext<UIntPtr>(Buf);
6891 /// Given a relocation from __compact_unwind, consisting of the RelocationRef
6892 /// and data being relocated, determine the best base Name and Addend to use for
6893 /// display purposes.
6895 /// 1. An Extern relocation will directly reference a symbol (and the data is
6896 /// then already an addend), so use that.
6897 /// 2. Otherwise the data is an offset in the object file's layout; try to find
6898 // a symbol before it in the same section, and use the offset from there.
6899 /// 3. Finally, if all that fails, fall back to an offset from the start of the
6900 /// referenced section.
6901 static void findUnwindRelocNameAddend(const MachOObjectFile *Obj,
6902 std::map<uint64_t, SymbolRef> &Symbols,
6903 const RelocationRef &Reloc, uint64_t Addr,
6904 StringRef &Name, uint64_t &Addend) {
6905 if (Reloc.getSymbol() != Obj->symbol_end()) {
6906 Expected<StringRef> NameOrErr = Reloc.getSymbol()->getName();
6908 report_error(Obj->getFileName(), NameOrErr.takeError());
6914 auto RE = Obj->getRelocation(Reloc.getRawDataRefImpl());
6915 SectionRef RelocSection = Obj->getAnyRelocationSection(RE);
6917 uint64_t SectionAddr = RelocSection.getAddress();
6919 auto Sym = Symbols.upper_bound(Addr);
6920 if (Sym == Symbols.begin()) {
6921 // The first symbol in the object is after this reference, the best we can
6922 // do is section-relative notation.
6923 RelocSection.getName(Name);
6924 Addend = Addr - SectionAddr;
6928 // Go back one so that SymbolAddress <= Addr.
6931 auto SectOrErr = Sym->second.getSection();
6933 report_error(Obj->getFileName(), SectOrErr.takeError());
6934 section_iterator SymSection = *SectOrErr;
6935 if (RelocSection == *SymSection) {
6936 // There's a valid symbol in the same section before this reference.
6937 Expected<StringRef> NameOrErr = Sym->second.getName();
6939 report_error(Obj->getFileName(), NameOrErr.takeError());
6941 Addend = Addr - Sym->first;
6945 // There is a symbol before this reference, but it's in a different
6946 // section. Probably not helpful to mention it, so use the section name.
6947 RelocSection.getName(Name);
6948 Addend = Addr - SectionAddr;
6951 static void printUnwindRelocDest(const MachOObjectFile *Obj,
6952 std::map<uint64_t, SymbolRef> &Symbols,
6953 const RelocationRef &Reloc, uint64_t Addr) {
6957 if (!Reloc.getObject())
6960 findUnwindRelocNameAddend(Obj, Symbols, Reloc, Addr, Name, Addend);
6964 outs() << " + " << format("0x%" PRIx64, Addend);
6968 printMachOCompactUnwindSection(const MachOObjectFile *Obj,
6969 std::map<uint64_t, SymbolRef> &Symbols,
6970 const SectionRef &CompactUnwind) {
6972 if (!Obj->isLittleEndian()) {
6973 outs() << "Skipping big-endian __compact_unwind section\n";
6977 bool Is64 = Obj->is64Bit();
6978 uint32_t PointerSize = Is64 ? sizeof(uint64_t) : sizeof(uint32_t);
6979 uint32_t EntrySize = 3 * PointerSize + 2 * sizeof(uint32_t);
6982 CompactUnwind.getContents(Contents);
6984 SmallVector<CompactUnwindEntry, 4> CompactUnwinds;
6986 // First populate the initial raw offsets, encodings and so on from the entry.
6987 for (unsigned Offset = 0; Offset < Contents.size(); Offset += EntrySize) {
6988 CompactUnwindEntry Entry(Contents.data(), Offset, Is64);
6989 CompactUnwinds.push_back(Entry);
6992 // Next we need to look at the relocations to find out what objects are
6993 // actually being referred to.
6994 for (const RelocationRef &Reloc : CompactUnwind.relocations()) {
6995 uint64_t RelocAddress = Reloc.getOffset();
6997 uint32_t EntryIdx = RelocAddress / EntrySize;
6998 uint32_t OffsetInEntry = RelocAddress - EntryIdx * EntrySize;
6999 CompactUnwindEntry &Entry = CompactUnwinds[EntryIdx];
7001 if (OffsetInEntry == 0)
7002 Entry.FunctionReloc = Reloc;
7003 else if (OffsetInEntry == PointerSize + 2 * sizeof(uint32_t))
7004 Entry.PersonalityReloc = Reloc;
7005 else if (OffsetInEntry == 2 * PointerSize + 2 * sizeof(uint32_t))
7006 Entry.LSDAReloc = Reloc;
7008 outs() << "Invalid relocation in __compact_unwind section\n";
7013 // Finally, we're ready to print the data we've gathered.
7014 outs() << "Contents of __compact_unwind section:\n";
7015 for (auto &Entry : CompactUnwinds) {
7016 outs() << " Entry at offset "
7017 << format("0x%" PRIx32, Entry.OffsetInSection) << ":\n";
7019 // 1. Start of the region this entry applies to.
7020 outs() << " start: " << format("0x%" PRIx64,
7021 Entry.FunctionAddr) << ' ';
7022 printUnwindRelocDest(Obj, Symbols, Entry.FunctionReloc, Entry.FunctionAddr);
7025 // 2. Length of the region this entry applies to.
7026 outs() << " length: " << format("0x%" PRIx32, Entry.Length)
7028 // 3. The 32-bit compact encoding.
7029 outs() << " compact encoding: "
7030 << format("0x%08" PRIx32, Entry.CompactEncoding) << '\n';
7032 // 4. The personality function, if present.
7033 if (Entry.PersonalityReloc.getObject()) {
7034 outs() << " personality function: "
7035 << format("0x%" PRIx64, Entry.PersonalityAddr) << ' ';
7036 printUnwindRelocDest(Obj, Symbols, Entry.PersonalityReloc,
7037 Entry.PersonalityAddr);
7041 // 5. This entry's language-specific data area.
7042 if (Entry.LSDAReloc.getObject()) {
7043 outs() << " LSDA: " << format("0x%" PRIx64,
7044 Entry.LSDAAddr) << ' ';
7045 printUnwindRelocDest(Obj, Symbols, Entry.LSDAReloc, Entry.LSDAAddr);
7051 //===----------------------------------------------------------------------===//
7052 // __unwind_info section dumping
7053 //===----------------------------------------------------------------------===//
7055 static void printRegularSecondLevelUnwindPage(const char *PageStart) {
7056 const char *Pos = PageStart;
7057 uint32_t Kind = readNext<uint32_t>(Pos);
7059 assert(Kind == 2 && "kind for a regular 2nd level index should be 2");
7061 uint16_t EntriesStart = readNext<uint16_t>(Pos);
7062 uint16_t NumEntries = readNext<uint16_t>(Pos);
7064 Pos = PageStart + EntriesStart;
7065 for (unsigned i = 0; i < NumEntries; ++i) {
7066 uint32_t FunctionOffset = readNext<uint32_t>(Pos);
7067 uint32_t Encoding = readNext<uint32_t>(Pos);
7069 outs() << " [" << i << "]: "
7070 << "function offset=" << format("0x%08" PRIx32, FunctionOffset)
7072 << "encoding=" << format("0x%08" PRIx32, Encoding) << '\n';
7076 static void printCompressedSecondLevelUnwindPage(
7077 const char *PageStart, uint32_t FunctionBase,
7078 const SmallVectorImpl<uint32_t> &CommonEncodings) {
7079 const char *Pos = PageStart;
7080 uint32_t Kind = readNext<uint32_t>(Pos);
7082 assert(Kind == 3 && "kind for a compressed 2nd level index should be 3");
7084 uint16_t EntriesStart = readNext<uint16_t>(Pos);
7085 uint16_t NumEntries = readNext<uint16_t>(Pos);
7087 uint16_t EncodingsStart = readNext<uint16_t>(Pos);
7088 readNext<uint16_t>(Pos);
7089 const auto *PageEncodings = reinterpret_cast<const support::ulittle32_t *>(
7090 PageStart + EncodingsStart);
7092 Pos = PageStart + EntriesStart;
7093 for (unsigned i = 0; i < NumEntries; ++i) {
7094 uint32_t Entry = readNext<uint32_t>(Pos);
7095 uint32_t FunctionOffset = FunctionBase + (Entry & 0xffffff);
7096 uint32_t EncodingIdx = Entry >> 24;
7099 if (EncodingIdx < CommonEncodings.size())
7100 Encoding = CommonEncodings[EncodingIdx];
7102 Encoding = PageEncodings[EncodingIdx - CommonEncodings.size()];
7104 outs() << " [" << i << "]: "
7105 << "function offset=" << format("0x%08" PRIx32, FunctionOffset)
7107 << "encoding[" << EncodingIdx
7108 << "]=" << format("0x%08" PRIx32, Encoding) << '\n';
7112 static void printMachOUnwindInfoSection(const MachOObjectFile *Obj,
7113 std::map<uint64_t, SymbolRef> &Symbols,
7114 const SectionRef &UnwindInfo) {
7116 if (!Obj->isLittleEndian()) {
7117 outs() << "Skipping big-endian __unwind_info section\n";
7121 outs() << "Contents of __unwind_info section:\n";
7124 UnwindInfo.getContents(Contents);
7125 const char *Pos = Contents.data();
7127 //===----------------------------------
7129 //===----------------------------------
7131 uint32_t Version = readNext<uint32_t>(Pos);
7132 outs() << " Version: "
7133 << format("0x%" PRIx32, Version) << '\n';
7135 outs() << " Skipping section with unknown version\n";
7139 uint32_t CommonEncodingsStart = readNext<uint32_t>(Pos);
7140 outs() << " Common encodings array section offset: "
7141 << format("0x%" PRIx32, CommonEncodingsStart) << '\n';
7142 uint32_t NumCommonEncodings = readNext<uint32_t>(Pos);
7143 outs() << " Number of common encodings in array: "
7144 << format("0x%" PRIx32, NumCommonEncodings) << '\n';
7146 uint32_t PersonalitiesStart = readNext<uint32_t>(Pos);
7147 outs() << " Personality function array section offset: "
7148 << format("0x%" PRIx32, PersonalitiesStart) << '\n';
7149 uint32_t NumPersonalities = readNext<uint32_t>(Pos);
7150 outs() << " Number of personality functions in array: "
7151 << format("0x%" PRIx32, NumPersonalities) << '\n';
7153 uint32_t IndicesStart = readNext<uint32_t>(Pos);
7154 outs() << " Index array section offset: "
7155 << format("0x%" PRIx32, IndicesStart) << '\n';
7156 uint32_t NumIndices = readNext<uint32_t>(Pos);
7157 outs() << " Number of indices in array: "
7158 << format("0x%" PRIx32, NumIndices) << '\n';
7160 //===----------------------------------
7161 // A shared list of common encodings
7162 //===----------------------------------
7164 // These occupy indices in the range [0, N] whenever an encoding is referenced
7165 // from a compressed 2nd level index table. In practice the linker only
7166 // creates ~128 of these, so that indices are available to embed encodings in
7167 // the 2nd level index.
7169 SmallVector<uint32_t, 64> CommonEncodings;
7170 outs() << " Common encodings: (count = " << NumCommonEncodings << ")\n";
7171 Pos = Contents.data() + CommonEncodingsStart;
7172 for (unsigned i = 0; i < NumCommonEncodings; ++i) {
7173 uint32_t Encoding = readNext<uint32_t>(Pos);
7174 CommonEncodings.push_back(Encoding);
7176 outs() << " encoding[" << i << "]: " << format("0x%08" PRIx32, Encoding)
7180 //===----------------------------------
7181 // Personality functions used in this executable
7182 //===----------------------------------
7184 // There should be only a handful of these (one per source language,
7185 // roughly). Particularly since they only get 2 bits in the compact encoding.
7187 outs() << " Personality functions: (count = " << NumPersonalities << ")\n";
7188 Pos = Contents.data() + PersonalitiesStart;
7189 for (unsigned i = 0; i < NumPersonalities; ++i) {
7190 uint32_t PersonalityFn = readNext<uint32_t>(Pos);
7191 outs() << " personality[" << i + 1
7192 << "]: " << format("0x%08" PRIx32, PersonalityFn) << '\n';
7195 //===----------------------------------
7196 // The level 1 index entries
7197 //===----------------------------------
7199 // These specify an approximate place to start searching for the more detailed
7200 // information, sorted by PC.
7203 uint32_t FunctionOffset;
7204 uint32_t SecondLevelPageStart;
7208 SmallVector<IndexEntry, 4> IndexEntries;
7210 outs() << " Top level indices: (count = " << NumIndices << ")\n";
7211 Pos = Contents.data() + IndicesStart;
7212 for (unsigned i = 0; i < NumIndices; ++i) {
7215 Entry.FunctionOffset = readNext<uint32_t>(Pos);
7216 Entry.SecondLevelPageStart = readNext<uint32_t>(Pos);
7217 Entry.LSDAStart = readNext<uint32_t>(Pos);
7218 IndexEntries.push_back(Entry);
7220 outs() << " [" << i << "]: "
7221 << "function offset=" << format("0x%08" PRIx32, Entry.FunctionOffset)
7223 << "2nd level page offset="
7224 << format("0x%08" PRIx32, Entry.SecondLevelPageStart) << ", "
7225 << "LSDA offset=" << format("0x%08" PRIx32, Entry.LSDAStart) << '\n';
7228 //===----------------------------------
7229 // Next come the LSDA tables
7230 //===----------------------------------
7232 // The LSDA layout is rather implicit: it's a contiguous array of entries from
7233 // the first top-level index's LSDAOffset to the last (sentinel).
7235 outs() << " LSDA descriptors:\n";
7236 Pos = Contents.data() + IndexEntries[0].LSDAStart;
7237 int NumLSDAs = (IndexEntries.back().LSDAStart - IndexEntries[0].LSDAStart) /
7238 (2 * sizeof(uint32_t));
7239 for (int i = 0; i < NumLSDAs; ++i) {
7240 uint32_t FunctionOffset = readNext<uint32_t>(Pos);
7241 uint32_t LSDAOffset = readNext<uint32_t>(Pos);
7242 outs() << " [" << i << "]: "
7243 << "function offset=" << format("0x%08" PRIx32, FunctionOffset)
7245 << "LSDA offset=" << format("0x%08" PRIx32, LSDAOffset) << '\n';
7248 //===----------------------------------
7249 // Finally, the 2nd level indices
7250 //===----------------------------------
7252 // Generally these are 4K in size, and have 2 possible forms:
7253 // + Regular stores up to 511 entries with disparate encodings
7254 // + Compressed stores up to 1021 entries if few enough compact encoding
7256 outs() << " Second level indices:\n";
7257 for (unsigned i = 0; i < IndexEntries.size() - 1; ++i) {
7258 // The final sentinel top-level index has no associated 2nd level page
7259 if (IndexEntries[i].SecondLevelPageStart == 0)
7262 outs() << " Second level index[" << i << "]: "
7263 << "offset in section="
7264 << format("0x%08" PRIx32, IndexEntries[i].SecondLevelPageStart)
7266 << "base function offset="
7267 << format("0x%08" PRIx32, IndexEntries[i].FunctionOffset) << '\n';
7269 Pos = Contents.data() + IndexEntries[i].SecondLevelPageStart;
7270 uint32_t Kind = *reinterpret_cast<const support::ulittle32_t *>(Pos);
7272 printRegularSecondLevelUnwindPage(Pos);
7274 printCompressedSecondLevelUnwindPage(Pos, IndexEntries[i].FunctionOffset,
7277 outs() << " Skipping 2nd level page with unknown kind " << Kind
7282 void llvm::printMachOUnwindInfo(const MachOObjectFile *Obj) {
7283 std::map<uint64_t, SymbolRef> Symbols;
7284 for (const SymbolRef &SymRef : Obj->symbols()) {
7285 // Discard any undefined or absolute symbols. They're not going to take part
7286 // in the convenience lookup for unwind info and just take up resources.
7287 auto SectOrErr = SymRef.getSection();
7289 // TODO: Actually report errors helpfully.
7290 consumeError(SectOrErr.takeError());
7293 section_iterator Section = *SectOrErr;
7294 if (Section == Obj->section_end())
7297 uint64_t Addr = SymRef.getValue();
7298 Symbols.insert(std::make_pair(Addr, SymRef));
7301 for (const SectionRef &Section : Obj->sections()) {
7303 Section.getName(SectName);
7304 if (SectName == "__compact_unwind")
7305 printMachOCompactUnwindSection(Obj, Symbols, Section);
7306 else if (SectName == "__unwind_info")
7307 printMachOUnwindInfoSection(Obj, Symbols, Section);
7311 static void PrintMachHeader(uint32_t magic, uint32_t cputype,
7312 uint32_t cpusubtype, uint32_t filetype,
7313 uint32_t ncmds, uint32_t sizeofcmds, uint32_t flags,
7315 outs() << "Mach header\n";
7316 outs() << " magic cputype cpusubtype caps filetype ncmds "
7317 "sizeofcmds flags\n";
7319 if (magic == MachO::MH_MAGIC)
7320 outs() << " MH_MAGIC";
7321 else if (magic == MachO::MH_MAGIC_64)
7322 outs() << "MH_MAGIC_64";
7324 outs() << format(" 0x%08" PRIx32, magic);
7326 case MachO::CPU_TYPE_I386:
7328 switch (cpusubtype & ~MachO::CPU_SUBTYPE_MASK) {
7329 case MachO::CPU_SUBTYPE_I386_ALL:
7333 outs() << format(" %10d", cpusubtype & ~MachO::CPU_SUBTYPE_MASK);
7337 case MachO::CPU_TYPE_X86_64:
7338 outs() << " X86_64";
7339 switch (cpusubtype & ~MachO::CPU_SUBTYPE_MASK) {
7340 case MachO::CPU_SUBTYPE_X86_64_ALL:
7343 case MachO::CPU_SUBTYPE_X86_64_H:
7344 outs() << " Haswell";
7347 outs() << format(" %10d", cpusubtype & ~MachO::CPU_SUBTYPE_MASK);
7351 case MachO::CPU_TYPE_ARM:
7353 switch (cpusubtype & ~MachO::CPU_SUBTYPE_MASK) {
7354 case MachO::CPU_SUBTYPE_ARM_ALL:
7357 case MachO::CPU_SUBTYPE_ARM_V4T:
7360 case MachO::CPU_SUBTYPE_ARM_V5TEJ:
7363 case MachO::CPU_SUBTYPE_ARM_XSCALE:
7364 outs() << " XSCALE";
7366 case MachO::CPU_SUBTYPE_ARM_V6:
7369 case MachO::CPU_SUBTYPE_ARM_V6M:
7372 case MachO::CPU_SUBTYPE_ARM_V7:
7375 case MachO::CPU_SUBTYPE_ARM_V7EM:
7378 case MachO::CPU_SUBTYPE_ARM_V7K:
7381 case MachO::CPU_SUBTYPE_ARM_V7M:
7384 case MachO::CPU_SUBTYPE_ARM_V7S:
7388 outs() << format(" %10d", cpusubtype & ~MachO::CPU_SUBTYPE_MASK);
7392 case MachO::CPU_TYPE_ARM64:
7394 switch (cpusubtype & ~MachO::CPU_SUBTYPE_MASK) {
7395 case MachO::CPU_SUBTYPE_ARM64_ALL:
7399 outs() << format(" %10d", cpusubtype & ~MachO::CPU_SUBTYPE_MASK);
7403 case MachO::CPU_TYPE_POWERPC:
7405 switch (cpusubtype & ~MachO::CPU_SUBTYPE_MASK) {
7406 case MachO::CPU_SUBTYPE_POWERPC_ALL:
7410 outs() << format(" %10d", cpusubtype & ~MachO::CPU_SUBTYPE_MASK);
7414 case MachO::CPU_TYPE_POWERPC64:
7416 switch (cpusubtype & ~MachO::CPU_SUBTYPE_MASK) {
7417 case MachO::CPU_SUBTYPE_POWERPC_ALL:
7421 outs() << format(" %10d", cpusubtype & ~MachO::CPU_SUBTYPE_MASK);
7426 outs() << format(" %7d", cputype);
7427 outs() << format(" %10d", cpusubtype & ~MachO::CPU_SUBTYPE_MASK);
7430 if ((cpusubtype & MachO::CPU_SUBTYPE_MASK) == MachO::CPU_SUBTYPE_LIB64) {
7433 outs() << format(" 0x%02" PRIx32,
7434 (cpusubtype & MachO::CPU_SUBTYPE_MASK) >> 24);
7437 case MachO::MH_OBJECT:
7438 outs() << " OBJECT";
7440 case MachO::MH_EXECUTE:
7441 outs() << " EXECUTE";
7443 case MachO::MH_FVMLIB:
7444 outs() << " FVMLIB";
7446 case MachO::MH_CORE:
7449 case MachO::MH_PRELOAD:
7450 outs() << " PRELOAD";
7452 case MachO::MH_DYLIB:
7455 case MachO::MH_DYLIB_STUB:
7456 outs() << " DYLIB_STUB";
7458 case MachO::MH_DYLINKER:
7459 outs() << " DYLINKER";
7461 case MachO::MH_BUNDLE:
7462 outs() << " BUNDLE";
7464 case MachO::MH_DSYM:
7467 case MachO::MH_KEXT_BUNDLE:
7468 outs() << " KEXTBUNDLE";
7471 outs() << format(" %10u", filetype);
7474 outs() << format(" %5u", ncmds);
7475 outs() << format(" %10u", sizeofcmds);
7477 if (f & MachO::MH_NOUNDEFS) {
7478 outs() << " NOUNDEFS";
7479 f &= ~MachO::MH_NOUNDEFS;
7481 if (f & MachO::MH_INCRLINK) {
7482 outs() << " INCRLINK";
7483 f &= ~MachO::MH_INCRLINK;
7485 if (f & MachO::MH_DYLDLINK) {
7486 outs() << " DYLDLINK";
7487 f &= ~MachO::MH_DYLDLINK;
7489 if (f & MachO::MH_BINDATLOAD) {
7490 outs() << " BINDATLOAD";
7491 f &= ~MachO::MH_BINDATLOAD;
7493 if (f & MachO::MH_PREBOUND) {
7494 outs() << " PREBOUND";
7495 f &= ~MachO::MH_PREBOUND;
7497 if (f & MachO::MH_SPLIT_SEGS) {
7498 outs() << " SPLIT_SEGS";
7499 f &= ~MachO::MH_SPLIT_SEGS;
7501 if (f & MachO::MH_LAZY_INIT) {
7502 outs() << " LAZY_INIT";
7503 f &= ~MachO::MH_LAZY_INIT;
7505 if (f & MachO::MH_TWOLEVEL) {
7506 outs() << " TWOLEVEL";
7507 f &= ~MachO::MH_TWOLEVEL;
7509 if (f & MachO::MH_FORCE_FLAT) {
7510 outs() << " FORCE_FLAT";
7511 f &= ~MachO::MH_FORCE_FLAT;
7513 if (f & MachO::MH_NOMULTIDEFS) {
7514 outs() << " NOMULTIDEFS";
7515 f &= ~MachO::MH_NOMULTIDEFS;
7517 if (f & MachO::MH_NOFIXPREBINDING) {
7518 outs() << " NOFIXPREBINDING";
7519 f &= ~MachO::MH_NOFIXPREBINDING;
7521 if (f & MachO::MH_PREBINDABLE) {
7522 outs() << " PREBINDABLE";
7523 f &= ~MachO::MH_PREBINDABLE;
7525 if (f & MachO::MH_ALLMODSBOUND) {
7526 outs() << " ALLMODSBOUND";
7527 f &= ~MachO::MH_ALLMODSBOUND;
7529 if (f & MachO::MH_SUBSECTIONS_VIA_SYMBOLS) {
7530 outs() << " SUBSECTIONS_VIA_SYMBOLS";
7531 f &= ~MachO::MH_SUBSECTIONS_VIA_SYMBOLS;
7533 if (f & MachO::MH_CANONICAL) {
7534 outs() << " CANONICAL";
7535 f &= ~MachO::MH_CANONICAL;
7537 if (f & MachO::MH_WEAK_DEFINES) {
7538 outs() << " WEAK_DEFINES";
7539 f &= ~MachO::MH_WEAK_DEFINES;
7541 if (f & MachO::MH_BINDS_TO_WEAK) {
7542 outs() << " BINDS_TO_WEAK";
7543 f &= ~MachO::MH_BINDS_TO_WEAK;
7545 if (f & MachO::MH_ALLOW_STACK_EXECUTION) {
7546 outs() << " ALLOW_STACK_EXECUTION";
7547 f &= ~MachO::MH_ALLOW_STACK_EXECUTION;
7549 if (f & MachO::MH_DEAD_STRIPPABLE_DYLIB) {
7550 outs() << " DEAD_STRIPPABLE_DYLIB";
7551 f &= ~MachO::MH_DEAD_STRIPPABLE_DYLIB;
7553 if (f & MachO::MH_PIE) {
7555 f &= ~MachO::MH_PIE;
7557 if (f & MachO::MH_NO_REEXPORTED_DYLIBS) {
7558 outs() << " NO_REEXPORTED_DYLIBS";
7559 f &= ~MachO::MH_NO_REEXPORTED_DYLIBS;
7561 if (f & MachO::MH_HAS_TLV_DESCRIPTORS) {
7562 outs() << " MH_HAS_TLV_DESCRIPTORS";
7563 f &= ~MachO::MH_HAS_TLV_DESCRIPTORS;
7565 if (f & MachO::MH_NO_HEAP_EXECUTION) {
7566 outs() << " MH_NO_HEAP_EXECUTION";
7567 f &= ~MachO::MH_NO_HEAP_EXECUTION;
7569 if (f & MachO::MH_APP_EXTENSION_SAFE) {
7570 outs() << " APP_EXTENSION_SAFE";
7571 f &= ~MachO::MH_APP_EXTENSION_SAFE;
7573 if (f != 0 || flags == 0)
7574 outs() << format(" 0x%08" PRIx32, f);
7576 outs() << format(" 0x%08" PRIx32, magic);
7577 outs() << format(" %7d", cputype);
7578 outs() << format(" %10d", cpusubtype & ~MachO::CPU_SUBTYPE_MASK);
7579 outs() << format(" 0x%02" PRIx32,
7580 (cpusubtype & MachO::CPU_SUBTYPE_MASK) >> 24);
7581 outs() << format(" %10u", filetype);
7582 outs() << format(" %5u", ncmds);
7583 outs() << format(" %10u", sizeofcmds);
7584 outs() << format(" 0x%08" PRIx32, flags);
7589 static void PrintSegmentCommand(uint32_t cmd, uint32_t cmdsize,
7590 StringRef SegName, uint64_t vmaddr,
7591 uint64_t vmsize, uint64_t fileoff,
7592 uint64_t filesize, uint32_t maxprot,
7593 uint32_t initprot, uint32_t nsects,
7594 uint32_t flags, uint32_t object_size,
7596 uint64_t expected_cmdsize;
7597 if (cmd == MachO::LC_SEGMENT) {
7598 outs() << " cmd LC_SEGMENT\n";
7599 expected_cmdsize = nsects;
7600 expected_cmdsize *= sizeof(struct MachO::section);
7601 expected_cmdsize += sizeof(struct MachO::segment_command);
7603 outs() << " cmd LC_SEGMENT_64\n";
7604 expected_cmdsize = nsects;
7605 expected_cmdsize *= sizeof(struct MachO::section_64);
7606 expected_cmdsize += sizeof(struct MachO::segment_command_64);
7608 outs() << " cmdsize " << cmdsize;
7609 if (cmdsize != expected_cmdsize)
7610 outs() << " Inconsistent size\n";
7613 outs() << " segname " << SegName << "\n";
7614 if (cmd == MachO::LC_SEGMENT_64) {
7615 outs() << " vmaddr " << format("0x%016" PRIx64, vmaddr) << "\n";
7616 outs() << " vmsize " << format("0x%016" PRIx64, vmsize) << "\n";
7618 outs() << " vmaddr " << format("0x%08" PRIx64, vmaddr) << "\n";
7619 outs() << " vmsize " << format("0x%08" PRIx64, vmsize) << "\n";
7621 outs() << " fileoff " << fileoff;
7622 if (fileoff > object_size)
7623 outs() << " (past end of file)\n";
7626 outs() << " filesize " << filesize;
7627 if (fileoff + filesize > object_size)
7628 outs() << " (past end of file)\n";
7633 ~(MachO::VM_PROT_READ | MachO::VM_PROT_WRITE |
7634 MachO::VM_PROT_EXECUTE)) != 0)
7635 outs() << " maxprot ?" << format("0x%08" PRIx32, maxprot) << "\n";
7637 outs() << " maxprot ";
7638 outs() << ((maxprot & MachO::VM_PROT_READ) ? "r" : "-");
7639 outs() << ((maxprot & MachO::VM_PROT_WRITE) ? "w" : "-");
7640 outs() << ((maxprot & MachO::VM_PROT_EXECUTE) ? "x\n" : "-\n");
7643 ~(MachO::VM_PROT_READ | MachO::VM_PROT_WRITE |
7644 MachO::VM_PROT_EXECUTE)) != 0)
7645 outs() << " initprot ?" << format("0x%08" PRIx32, initprot) << "\n";
7647 outs() << " initprot ";
7648 outs() << ((initprot & MachO::VM_PROT_READ) ? "r" : "-");
7649 outs() << ((initprot & MachO::VM_PROT_WRITE) ? "w" : "-");
7650 outs() << ((initprot & MachO::VM_PROT_EXECUTE) ? "x\n" : "-\n");
7653 outs() << " maxprot " << format("0x%08" PRIx32, maxprot) << "\n";
7654 outs() << " initprot " << format("0x%08" PRIx32, initprot) << "\n";
7656 outs() << " nsects " << nsects << "\n";
7660 outs() << " (none)\n";
7662 if (flags & MachO::SG_HIGHVM) {
7663 outs() << " HIGHVM";
7664 flags &= ~MachO::SG_HIGHVM;
7666 if (flags & MachO::SG_FVMLIB) {
7667 outs() << " FVMLIB";
7668 flags &= ~MachO::SG_FVMLIB;
7670 if (flags & MachO::SG_NORELOC) {
7671 outs() << " NORELOC";
7672 flags &= ~MachO::SG_NORELOC;
7674 if (flags & MachO::SG_PROTECTED_VERSION_1) {
7675 outs() << " PROTECTED_VERSION_1";
7676 flags &= ~MachO::SG_PROTECTED_VERSION_1;
7679 outs() << format(" 0x%08" PRIx32, flags) << " (unknown flags)\n";
7684 outs() << " flags " << format("0x%" PRIx32, flags) << "\n";
7688 static void PrintSection(const char *sectname, const char *segname,
7689 uint64_t addr, uint64_t size, uint32_t offset,
7690 uint32_t align, uint32_t reloff, uint32_t nreloc,
7691 uint32_t flags, uint32_t reserved1, uint32_t reserved2,
7692 uint32_t cmd, const char *sg_segname,
7693 uint32_t filetype, uint32_t object_size,
7695 outs() << "Section\n";
7696 outs() << " sectname " << format("%.16s\n", sectname);
7697 outs() << " segname " << format("%.16s", segname);
7698 if (filetype != MachO::MH_OBJECT && strncmp(sg_segname, segname, 16) != 0)
7699 outs() << " (does not match segment)\n";
7702 if (cmd == MachO::LC_SEGMENT_64) {
7703 outs() << " addr " << format("0x%016" PRIx64, addr) << "\n";
7704 outs() << " size " << format("0x%016" PRIx64, size);
7706 outs() << " addr " << format("0x%08" PRIx64, addr) << "\n";
7707 outs() << " size " << format("0x%08" PRIx64, size);
7709 if ((flags & MachO::S_ZEROFILL) != 0 && offset + size > object_size)
7710 outs() << " (past end of file)\n";
7713 outs() << " offset " << offset;
7714 if (offset > object_size)
7715 outs() << " (past end of file)\n";
7718 uint32_t align_shifted = 1 << align;
7719 outs() << " align 2^" << align << " (" << align_shifted << ")\n";
7720 outs() << " reloff " << reloff;
7721 if (reloff > object_size)
7722 outs() << " (past end of file)\n";
7725 outs() << " nreloc " << nreloc;
7726 if (reloff + nreloc * sizeof(struct MachO::relocation_info) > object_size)
7727 outs() << " (past end of file)\n";
7730 uint32_t section_type = flags & MachO::SECTION_TYPE;
7733 if (section_type == MachO::S_REGULAR)
7734 outs() << " S_REGULAR\n";
7735 else if (section_type == MachO::S_ZEROFILL)
7736 outs() << " S_ZEROFILL\n";
7737 else if (section_type == MachO::S_CSTRING_LITERALS)
7738 outs() << " S_CSTRING_LITERALS\n";
7739 else if (section_type == MachO::S_4BYTE_LITERALS)
7740 outs() << " S_4BYTE_LITERALS\n";
7741 else if (section_type == MachO::S_8BYTE_LITERALS)
7742 outs() << " S_8BYTE_LITERALS\n";
7743 else if (section_type == MachO::S_16BYTE_LITERALS)
7744 outs() << " S_16BYTE_LITERALS\n";
7745 else if (section_type == MachO::S_LITERAL_POINTERS)
7746 outs() << " S_LITERAL_POINTERS\n";
7747 else if (section_type == MachO::S_NON_LAZY_SYMBOL_POINTERS)
7748 outs() << " S_NON_LAZY_SYMBOL_POINTERS\n";
7749 else if (section_type == MachO::S_LAZY_SYMBOL_POINTERS)
7750 outs() << " S_LAZY_SYMBOL_POINTERS\n";
7751 else if (section_type == MachO::S_SYMBOL_STUBS)
7752 outs() << " S_SYMBOL_STUBS\n";
7753 else if (section_type == MachO::S_MOD_INIT_FUNC_POINTERS)
7754 outs() << " S_MOD_INIT_FUNC_POINTERS\n";
7755 else if (section_type == MachO::S_MOD_TERM_FUNC_POINTERS)
7756 outs() << " S_MOD_TERM_FUNC_POINTERS\n";
7757 else if (section_type == MachO::S_COALESCED)
7758 outs() << " S_COALESCED\n";
7759 else if (section_type == MachO::S_INTERPOSING)
7760 outs() << " S_INTERPOSING\n";
7761 else if (section_type == MachO::S_DTRACE_DOF)
7762 outs() << " S_DTRACE_DOF\n";
7763 else if (section_type == MachO::S_LAZY_DYLIB_SYMBOL_POINTERS)
7764 outs() << " S_LAZY_DYLIB_SYMBOL_POINTERS\n";
7765 else if (section_type == MachO::S_THREAD_LOCAL_REGULAR)
7766 outs() << " S_THREAD_LOCAL_REGULAR\n";
7767 else if (section_type == MachO::S_THREAD_LOCAL_ZEROFILL)
7768 outs() << " S_THREAD_LOCAL_ZEROFILL\n";
7769 else if (section_type == MachO::S_THREAD_LOCAL_VARIABLES)
7770 outs() << " S_THREAD_LOCAL_VARIABLES\n";
7771 else if (section_type == MachO::S_THREAD_LOCAL_VARIABLE_POINTERS)
7772 outs() << " S_THREAD_LOCAL_VARIABLE_POINTERS\n";
7773 else if (section_type == MachO::S_THREAD_LOCAL_INIT_FUNCTION_POINTERS)
7774 outs() << " S_THREAD_LOCAL_INIT_FUNCTION_POINTERS\n";
7776 outs() << format("0x%08" PRIx32, section_type) << "\n";
7777 outs() << "attributes";
7778 uint32_t section_attributes = flags & MachO::SECTION_ATTRIBUTES;
7779 if (section_attributes & MachO::S_ATTR_PURE_INSTRUCTIONS)
7780 outs() << " PURE_INSTRUCTIONS";
7781 if (section_attributes & MachO::S_ATTR_NO_TOC)
7782 outs() << " NO_TOC";
7783 if (section_attributes & MachO::S_ATTR_STRIP_STATIC_SYMS)
7784 outs() << " STRIP_STATIC_SYMS";
7785 if (section_attributes & MachO::S_ATTR_NO_DEAD_STRIP)
7786 outs() << " NO_DEAD_STRIP";
7787 if (section_attributes & MachO::S_ATTR_LIVE_SUPPORT)
7788 outs() << " LIVE_SUPPORT";
7789 if (section_attributes & MachO::S_ATTR_SELF_MODIFYING_CODE)
7790 outs() << " SELF_MODIFYING_CODE";
7791 if (section_attributes & MachO::S_ATTR_DEBUG)
7793 if (section_attributes & MachO::S_ATTR_SOME_INSTRUCTIONS)
7794 outs() << " SOME_INSTRUCTIONS";
7795 if (section_attributes & MachO::S_ATTR_EXT_RELOC)
7796 outs() << " EXT_RELOC";
7797 if (section_attributes & MachO::S_ATTR_LOC_RELOC)
7798 outs() << " LOC_RELOC";
7799 if (section_attributes == 0)
7800 outs() << " (none)";
7803 outs() << " flags " << format("0x%08" PRIx32, flags) << "\n";
7804 outs() << " reserved1 " << reserved1;
7805 if (section_type == MachO::S_SYMBOL_STUBS ||
7806 section_type == MachO::S_LAZY_SYMBOL_POINTERS ||
7807 section_type == MachO::S_LAZY_DYLIB_SYMBOL_POINTERS ||
7808 section_type == MachO::S_NON_LAZY_SYMBOL_POINTERS ||
7809 section_type == MachO::S_THREAD_LOCAL_VARIABLE_POINTERS)
7810 outs() << " (index into indirect symbol table)\n";
7813 outs() << " reserved2 " << reserved2;
7814 if (section_type == MachO::S_SYMBOL_STUBS)
7815 outs() << " (size of stubs)\n";
7820 static void PrintSymtabLoadCommand(MachO::symtab_command st, bool Is64Bit,
7821 uint32_t object_size) {
7822 outs() << " cmd LC_SYMTAB\n";
7823 outs() << " cmdsize " << st.cmdsize;
7824 if (st.cmdsize != sizeof(struct MachO::symtab_command))
7825 outs() << " Incorrect size\n";
7828 outs() << " symoff " << st.symoff;
7829 if (st.symoff > object_size)
7830 outs() << " (past end of file)\n";
7833 outs() << " nsyms " << st.nsyms;
7836 big_size = st.nsyms;
7837 big_size *= sizeof(struct MachO::nlist_64);
7838 big_size += st.symoff;
7839 if (big_size > object_size)
7840 outs() << " (past end of file)\n";
7844 big_size = st.nsyms;
7845 big_size *= sizeof(struct MachO::nlist);
7846 big_size += st.symoff;
7847 if (big_size > object_size)
7848 outs() << " (past end of file)\n";
7852 outs() << " stroff " << st.stroff;
7853 if (st.stroff > object_size)
7854 outs() << " (past end of file)\n";
7857 outs() << " strsize " << st.strsize;
7858 big_size = st.stroff;
7859 big_size += st.strsize;
7860 if (big_size > object_size)
7861 outs() << " (past end of file)\n";
7866 static void PrintDysymtabLoadCommand(MachO::dysymtab_command dyst,
7867 uint32_t nsyms, uint32_t object_size,
7869 outs() << " cmd LC_DYSYMTAB\n";
7870 outs() << " cmdsize " << dyst.cmdsize;
7871 if (dyst.cmdsize != sizeof(struct MachO::dysymtab_command))
7872 outs() << " Incorrect size\n";
7875 outs() << " ilocalsym " << dyst.ilocalsym;
7876 if (dyst.ilocalsym > nsyms)
7877 outs() << " (greater than the number of symbols)\n";
7880 outs() << " nlocalsym " << dyst.nlocalsym;
7882 big_size = dyst.ilocalsym;
7883 big_size += dyst.nlocalsym;
7884 if (big_size > nsyms)
7885 outs() << " (past the end of the symbol table)\n";
7888 outs() << " iextdefsym " << dyst.iextdefsym;
7889 if (dyst.iextdefsym > nsyms)
7890 outs() << " (greater than the number of symbols)\n";
7893 outs() << " nextdefsym " << dyst.nextdefsym;
7894 big_size = dyst.iextdefsym;
7895 big_size += dyst.nextdefsym;
7896 if (big_size > nsyms)
7897 outs() << " (past the end of the symbol table)\n";
7900 outs() << " iundefsym " << dyst.iundefsym;
7901 if (dyst.iundefsym > nsyms)
7902 outs() << " (greater than the number of symbols)\n";
7905 outs() << " nundefsym " << dyst.nundefsym;
7906 big_size = dyst.iundefsym;
7907 big_size += dyst.nundefsym;
7908 if (big_size > nsyms)
7909 outs() << " (past the end of the symbol table)\n";
7912 outs() << " tocoff " << dyst.tocoff;
7913 if (dyst.tocoff > object_size)
7914 outs() << " (past end of file)\n";
7917 outs() << " ntoc " << dyst.ntoc;
7918 big_size = dyst.ntoc;
7919 big_size *= sizeof(struct MachO::dylib_table_of_contents);
7920 big_size += dyst.tocoff;
7921 if (big_size > object_size)
7922 outs() << " (past end of file)\n";
7925 outs() << " modtaboff " << dyst.modtaboff;
7926 if (dyst.modtaboff > object_size)
7927 outs() << " (past end of file)\n";
7930 outs() << " nmodtab " << dyst.nmodtab;
7933 modtabend = dyst.nmodtab;
7934 modtabend *= sizeof(struct MachO::dylib_module_64);
7935 modtabend += dyst.modtaboff;
7937 modtabend = dyst.nmodtab;
7938 modtabend *= sizeof(struct MachO::dylib_module);
7939 modtabend += dyst.modtaboff;
7941 if (modtabend > object_size)
7942 outs() << " (past end of file)\n";
7945 outs() << " extrefsymoff " << dyst.extrefsymoff;
7946 if (dyst.extrefsymoff > object_size)
7947 outs() << " (past end of file)\n";
7950 outs() << " nextrefsyms " << dyst.nextrefsyms;
7951 big_size = dyst.nextrefsyms;
7952 big_size *= sizeof(struct MachO::dylib_reference);
7953 big_size += dyst.extrefsymoff;
7954 if (big_size > object_size)
7955 outs() << " (past end of file)\n";
7958 outs() << " indirectsymoff " << dyst.indirectsymoff;
7959 if (dyst.indirectsymoff > object_size)
7960 outs() << " (past end of file)\n";
7963 outs() << " nindirectsyms " << dyst.nindirectsyms;
7964 big_size = dyst.nindirectsyms;
7965 big_size *= sizeof(uint32_t);
7966 big_size += dyst.indirectsymoff;
7967 if (big_size > object_size)
7968 outs() << " (past end of file)\n";
7971 outs() << " extreloff " << dyst.extreloff;
7972 if (dyst.extreloff > object_size)
7973 outs() << " (past end of file)\n";
7976 outs() << " nextrel " << dyst.nextrel;
7977 big_size = dyst.nextrel;
7978 big_size *= sizeof(struct MachO::relocation_info);
7979 big_size += dyst.extreloff;
7980 if (big_size > object_size)
7981 outs() << " (past end of file)\n";
7984 outs() << " locreloff " << dyst.locreloff;
7985 if (dyst.locreloff > object_size)
7986 outs() << " (past end of file)\n";
7989 outs() << " nlocrel " << dyst.nlocrel;
7990 big_size = dyst.nlocrel;
7991 big_size *= sizeof(struct MachO::relocation_info);
7992 big_size += dyst.locreloff;
7993 if (big_size > object_size)
7994 outs() << " (past end of file)\n";
7999 static void PrintDyldInfoLoadCommand(MachO::dyld_info_command dc,
8000 uint32_t object_size) {
8001 if (dc.cmd == MachO::LC_DYLD_INFO)
8002 outs() << " cmd LC_DYLD_INFO\n";
8004 outs() << " cmd LC_DYLD_INFO_ONLY\n";
8005 outs() << " cmdsize " << dc.cmdsize;
8006 if (dc.cmdsize != sizeof(struct MachO::dyld_info_command))
8007 outs() << " Incorrect size\n";
8010 outs() << " rebase_off " << dc.rebase_off;
8011 if (dc.rebase_off > object_size)
8012 outs() << " (past end of file)\n";
8015 outs() << " rebase_size " << dc.rebase_size;
8017 big_size = dc.rebase_off;
8018 big_size += dc.rebase_size;
8019 if (big_size > object_size)
8020 outs() << " (past end of file)\n";
8023 outs() << " bind_off " << dc.bind_off;
8024 if (dc.bind_off > object_size)
8025 outs() << " (past end of file)\n";
8028 outs() << " bind_size " << dc.bind_size;
8029 big_size = dc.bind_off;
8030 big_size += dc.bind_size;
8031 if (big_size > object_size)
8032 outs() << " (past end of file)\n";
8035 outs() << " weak_bind_off " << dc.weak_bind_off;
8036 if (dc.weak_bind_off > object_size)
8037 outs() << " (past end of file)\n";
8040 outs() << " weak_bind_size " << dc.weak_bind_size;
8041 big_size = dc.weak_bind_off;
8042 big_size += dc.weak_bind_size;
8043 if (big_size > object_size)
8044 outs() << " (past end of file)\n";
8047 outs() << " lazy_bind_off " << dc.lazy_bind_off;
8048 if (dc.lazy_bind_off > object_size)
8049 outs() << " (past end of file)\n";
8052 outs() << " lazy_bind_size " << dc.lazy_bind_size;
8053 big_size = dc.lazy_bind_off;
8054 big_size += dc.lazy_bind_size;
8055 if (big_size > object_size)
8056 outs() << " (past end of file)\n";
8059 outs() << " export_off " << dc.export_off;
8060 if (dc.export_off > object_size)
8061 outs() << " (past end of file)\n";
8064 outs() << " export_size " << dc.export_size;
8065 big_size = dc.export_off;
8066 big_size += dc.export_size;
8067 if (big_size > object_size)
8068 outs() << " (past end of file)\n";
8073 static void PrintDyldLoadCommand(MachO::dylinker_command dyld,
8075 if (dyld.cmd == MachO::LC_ID_DYLINKER)
8076 outs() << " cmd LC_ID_DYLINKER\n";
8077 else if (dyld.cmd == MachO::LC_LOAD_DYLINKER)
8078 outs() << " cmd LC_LOAD_DYLINKER\n";
8079 else if (dyld.cmd == MachO::LC_DYLD_ENVIRONMENT)
8080 outs() << " cmd LC_DYLD_ENVIRONMENT\n";
8082 outs() << " cmd ?(" << dyld.cmd << ")\n";
8083 outs() << " cmdsize " << dyld.cmdsize;
8084 if (dyld.cmdsize < sizeof(struct MachO::dylinker_command))
8085 outs() << " Incorrect size\n";
8088 if (dyld.name >= dyld.cmdsize)
8089 outs() << " name ?(bad offset " << dyld.name << ")\n";
8091 const char *P = (const char *)(Ptr) + dyld.name;
8092 outs() << " name " << P << " (offset " << dyld.name << ")\n";
8096 static void PrintUuidLoadCommand(MachO::uuid_command uuid) {
8097 outs() << " cmd LC_UUID\n";
8098 outs() << " cmdsize " << uuid.cmdsize;
8099 if (uuid.cmdsize != sizeof(struct MachO::uuid_command))
8100 outs() << " Incorrect size\n";
8104 for (int i = 0; i < 16; ++i) {
8105 outs() << format("%02" PRIX32, uuid.uuid[i]);
8106 if (i == 3 || i == 5 || i == 7 || i == 9)
8112 static void PrintRpathLoadCommand(MachO::rpath_command rpath, const char *Ptr) {
8113 outs() << " cmd LC_RPATH\n";
8114 outs() << " cmdsize " << rpath.cmdsize;
8115 if (rpath.cmdsize < sizeof(struct MachO::rpath_command))
8116 outs() << " Incorrect size\n";
8119 if (rpath.path >= rpath.cmdsize)
8120 outs() << " path ?(bad offset " << rpath.path << ")\n";
8122 const char *P = (const char *)(Ptr) + rpath.path;
8123 outs() << " path " << P << " (offset " << rpath.path << ")\n";
8127 static void PrintVersionMinLoadCommand(MachO::version_min_command vd) {
8128 StringRef LoadCmdName;
8130 case MachO::LC_VERSION_MIN_MACOSX:
8131 LoadCmdName = "LC_VERSION_MIN_MACOSX";
8133 case MachO::LC_VERSION_MIN_IPHONEOS:
8134 LoadCmdName = "LC_VERSION_MIN_IPHONEOS";
8136 case MachO::LC_VERSION_MIN_TVOS:
8137 LoadCmdName = "LC_VERSION_MIN_TVOS";
8139 case MachO::LC_VERSION_MIN_WATCHOS:
8140 LoadCmdName = "LC_VERSION_MIN_WATCHOS";
8143 llvm_unreachable("Unknown version min load command");
8146 outs() << " cmd " << LoadCmdName << '\n';
8147 outs() << " cmdsize " << vd.cmdsize;
8148 if (vd.cmdsize != sizeof(struct MachO::version_min_command))
8149 outs() << " Incorrect size\n";
8152 outs() << " version "
8153 << MachOObjectFile::getVersionMinMajor(vd, false) << "."
8154 << MachOObjectFile::getVersionMinMinor(vd, false);
8155 uint32_t Update = MachOObjectFile::getVersionMinUpdate(vd, false);
8157 outs() << "." << Update;
8160 outs() << " sdk n/a";
8163 << MachOObjectFile::getVersionMinMajor(vd, true) << "."
8164 << MachOObjectFile::getVersionMinMinor(vd, true);
8166 Update = MachOObjectFile::getVersionMinUpdate(vd, true);
8168 outs() << "." << Update;
8172 static void PrintSourceVersionCommand(MachO::source_version_command sd) {
8173 outs() << " cmd LC_SOURCE_VERSION\n";
8174 outs() << " cmdsize " << sd.cmdsize;
8175 if (sd.cmdsize != sizeof(struct MachO::source_version_command))
8176 outs() << " Incorrect size\n";
8179 uint64_t a = (sd.version >> 40) & 0xffffff;
8180 uint64_t b = (sd.version >> 30) & 0x3ff;
8181 uint64_t c = (sd.version >> 20) & 0x3ff;
8182 uint64_t d = (sd.version >> 10) & 0x3ff;
8183 uint64_t e = sd.version & 0x3ff;
8184 outs() << " version " << a << "." << b;
8186 outs() << "." << c << "." << d << "." << e;
8188 outs() << "." << c << "." << d;
8194 static void PrintEntryPointCommand(MachO::entry_point_command ep) {
8195 outs() << " cmd LC_MAIN\n";
8196 outs() << " cmdsize " << ep.cmdsize;
8197 if (ep.cmdsize != sizeof(struct MachO::entry_point_command))
8198 outs() << " Incorrect size\n";
8201 outs() << " entryoff " << ep.entryoff << "\n";
8202 outs() << " stacksize " << ep.stacksize << "\n";
8205 static void PrintEncryptionInfoCommand(MachO::encryption_info_command ec,
8206 uint32_t object_size) {
8207 outs() << " cmd LC_ENCRYPTION_INFO\n";
8208 outs() << " cmdsize " << ec.cmdsize;
8209 if (ec.cmdsize != sizeof(struct MachO::encryption_info_command))
8210 outs() << " Incorrect size\n";
8213 outs() << " cryptoff " << ec.cryptoff;
8214 if (ec.cryptoff > object_size)
8215 outs() << " (past end of file)\n";
8218 outs() << " cryptsize " << ec.cryptsize;
8219 if (ec.cryptsize > object_size)
8220 outs() << " (past end of file)\n";
8223 outs() << " cryptid " << ec.cryptid << "\n";
8226 static void PrintEncryptionInfoCommand64(MachO::encryption_info_command_64 ec,
8227 uint32_t object_size) {
8228 outs() << " cmd LC_ENCRYPTION_INFO_64\n";
8229 outs() << " cmdsize " << ec.cmdsize;
8230 if (ec.cmdsize != sizeof(struct MachO::encryption_info_command_64))
8231 outs() << " Incorrect size\n";
8234 outs() << " cryptoff " << ec.cryptoff;
8235 if (ec.cryptoff > object_size)
8236 outs() << " (past end of file)\n";
8239 outs() << " cryptsize " << ec.cryptsize;
8240 if (ec.cryptsize > object_size)
8241 outs() << " (past end of file)\n";
8244 outs() << " cryptid " << ec.cryptid << "\n";
8245 outs() << " pad " << ec.pad << "\n";
8248 static void PrintLinkerOptionCommand(MachO::linker_option_command lo,
8250 outs() << " cmd LC_LINKER_OPTION\n";
8251 outs() << " cmdsize " << lo.cmdsize;
8252 if (lo.cmdsize < sizeof(struct MachO::linker_option_command))
8253 outs() << " Incorrect size\n";
8256 outs() << " count " << lo.count << "\n";
8257 const char *string = Ptr + sizeof(struct MachO::linker_option_command);
8258 uint32_t left = lo.cmdsize - sizeof(struct MachO::linker_option_command);
8261 while (*string == '\0' && left > 0) {
8267 outs() << " string #" << i << " " << format("%.*s\n", left, string);
8268 uint32_t NullPos = StringRef(string, left).find('\0');
8269 uint32_t len = std::min(NullPos, left) + 1;
8275 outs() << " count " << lo.count << " does not match number of strings "
8279 static void PrintSubFrameworkCommand(MachO::sub_framework_command sub,
8281 outs() << " cmd LC_SUB_FRAMEWORK\n";
8282 outs() << " cmdsize " << sub.cmdsize;
8283 if (sub.cmdsize < sizeof(struct MachO::sub_framework_command))
8284 outs() << " Incorrect size\n";
8287 if (sub.umbrella < sub.cmdsize) {
8288 const char *P = Ptr + sub.umbrella;
8289 outs() << " umbrella " << P << " (offset " << sub.umbrella << ")\n";
8291 outs() << " umbrella ?(bad offset " << sub.umbrella << ")\n";
8295 static void PrintSubUmbrellaCommand(MachO::sub_umbrella_command sub,
8297 outs() << " cmd LC_SUB_UMBRELLA\n";
8298 outs() << " cmdsize " << sub.cmdsize;
8299 if (sub.cmdsize < sizeof(struct MachO::sub_umbrella_command))
8300 outs() << " Incorrect size\n";
8303 if (sub.sub_umbrella < sub.cmdsize) {
8304 const char *P = Ptr + sub.sub_umbrella;
8305 outs() << " sub_umbrella " << P << " (offset " << sub.sub_umbrella << ")\n";
8307 outs() << " sub_umbrella ?(bad offset " << sub.sub_umbrella << ")\n";
8311 static void PrintSubLibraryCommand(MachO::sub_library_command sub,
8313 outs() << " cmd LC_SUB_LIBRARY\n";
8314 outs() << " cmdsize " << sub.cmdsize;
8315 if (sub.cmdsize < sizeof(struct MachO::sub_library_command))
8316 outs() << " Incorrect size\n";
8319 if (sub.sub_library < sub.cmdsize) {
8320 const char *P = Ptr + sub.sub_library;
8321 outs() << " sub_library " << P << " (offset " << sub.sub_library << ")\n";
8323 outs() << " sub_library ?(bad offset " << sub.sub_library << ")\n";
8327 static void PrintSubClientCommand(MachO::sub_client_command sub,
8329 outs() << " cmd LC_SUB_CLIENT\n";
8330 outs() << " cmdsize " << sub.cmdsize;
8331 if (sub.cmdsize < sizeof(struct MachO::sub_client_command))
8332 outs() << " Incorrect size\n";
8335 if (sub.client < sub.cmdsize) {
8336 const char *P = Ptr + sub.client;
8337 outs() << " client " << P << " (offset " << sub.client << ")\n";
8339 outs() << " client ?(bad offset " << sub.client << ")\n";
8343 static void PrintRoutinesCommand(MachO::routines_command r) {
8344 outs() << " cmd LC_ROUTINES\n";
8345 outs() << " cmdsize " << r.cmdsize;
8346 if (r.cmdsize != sizeof(struct MachO::routines_command))
8347 outs() << " Incorrect size\n";
8350 outs() << " init_address " << format("0x%08" PRIx32, r.init_address) << "\n";
8351 outs() << " init_module " << r.init_module << "\n";
8352 outs() << " reserved1 " << r.reserved1 << "\n";
8353 outs() << " reserved2 " << r.reserved2 << "\n";
8354 outs() << " reserved3 " << r.reserved3 << "\n";
8355 outs() << " reserved4 " << r.reserved4 << "\n";
8356 outs() << " reserved5 " << r.reserved5 << "\n";
8357 outs() << " reserved6 " << r.reserved6 << "\n";
8360 static void PrintRoutinesCommand64(MachO::routines_command_64 r) {
8361 outs() << " cmd LC_ROUTINES_64\n";
8362 outs() << " cmdsize " << r.cmdsize;
8363 if (r.cmdsize != sizeof(struct MachO::routines_command_64))
8364 outs() << " Incorrect size\n";
8367 outs() << " init_address " << format("0x%016" PRIx64, r.init_address) << "\n";
8368 outs() << " init_module " << r.init_module << "\n";
8369 outs() << " reserved1 " << r.reserved1 << "\n";
8370 outs() << " reserved2 " << r.reserved2 << "\n";
8371 outs() << " reserved3 " << r.reserved3 << "\n";
8372 outs() << " reserved4 " << r.reserved4 << "\n";
8373 outs() << " reserved5 " << r.reserved5 << "\n";
8374 outs() << " reserved6 " << r.reserved6 << "\n";
8377 static void Print_x86_thread_state64_t(MachO::x86_thread_state64_t &cpu64) {
8378 outs() << " rax " << format("0x%016" PRIx64, cpu64.rax);
8379 outs() << " rbx " << format("0x%016" PRIx64, cpu64.rbx);
8380 outs() << " rcx " << format("0x%016" PRIx64, cpu64.rcx) << "\n";
8381 outs() << " rdx " << format("0x%016" PRIx64, cpu64.rdx);
8382 outs() << " rdi " << format("0x%016" PRIx64, cpu64.rdi);
8383 outs() << " rsi " << format("0x%016" PRIx64, cpu64.rsi) << "\n";
8384 outs() << " rbp " << format("0x%016" PRIx64, cpu64.rbp);
8385 outs() << " rsp " << format("0x%016" PRIx64, cpu64.rsp);
8386 outs() << " r8 " << format("0x%016" PRIx64, cpu64.r8) << "\n";
8387 outs() << " r9 " << format("0x%016" PRIx64, cpu64.r9);
8388 outs() << " r10 " << format("0x%016" PRIx64, cpu64.r10);
8389 outs() << " r11 " << format("0x%016" PRIx64, cpu64.r11) << "\n";
8390 outs() << " r12 " << format("0x%016" PRIx64, cpu64.r12);
8391 outs() << " r13 " << format("0x%016" PRIx64, cpu64.r13);
8392 outs() << " r14 " << format("0x%016" PRIx64, cpu64.r14) << "\n";
8393 outs() << " r15 " << format("0x%016" PRIx64, cpu64.r15);
8394 outs() << " rip " << format("0x%016" PRIx64, cpu64.rip) << "\n";
8395 outs() << "rflags " << format("0x%016" PRIx64, cpu64.rflags);
8396 outs() << " cs " << format("0x%016" PRIx64, cpu64.cs);
8397 outs() << " fs " << format("0x%016" PRIx64, cpu64.fs) << "\n";
8398 outs() << " gs " << format("0x%016" PRIx64, cpu64.gs) << "\n";
8401 static void Print_mmst_reg(MachO::mmst_reg_t &r) {
8403 outs() << "\t mmst_reg ";
8404 for (f = 0; f < 10; f++)
8405 outs() << format("%02" PRIx32, (r.mmst_reg[f] & 0xff)) << " ";
8407 outs() << "\t mmst_rsrv ";
8408 for (f = 0; f < 6; f++)
8409 outs() << format("%02" PRIx32, (r.mmst_rsrv[f] & 0xff)) << " ";
8413 static void Print_xmm_reg(MachO::xmm_reg_t &r) {
8415 outs() << "\t xmm_reg ";
8416 for (f = 0; f < 16; f++)
8417 outs() << format("%02" PRIx32, (r.xmm_reg[f] & 0xff)) << " ";
8421 static void Print_x86_float_state_t(MachO::x86_float_state64_t &fpu) {
8422 outs() << "\t fpu_reserved[0] " << fpu.fpu_reserved[0];
8423 outs() << " fpu_reserved[1] " << fpu.fpu_reserved[1] << "\n";
8424 outs() << "\t control: invalid " << fpu.fpu_fcw.invalid;
8425 outs() << " denorm " << fpu.fpu_fcw.denorm;
8426 outs() << " zdiv " << fpu.fpu_fcw.zdiv;
8427 outs() << " ovrfl " << fpu.fpu_fcw.ovrfl;
8428 outs() << " undfl " << fpu.fpu_fcw.undfl;
8429 outs() << " precis " << fpu.fpu_fcw.precis << "\n";
8430 outs() << "\t\t pc ";
8431 if (fpu.fpu_fcw.pc == MachO::x86_FP_PREC_24B)
8432 outs() << "FP_PREC_24B ";
8433 else if (fpu.fpu_fcw.pc == MachO::x86_FP_PREC_53B)
8434 outs() << "FP_PREC_53B ";
8435 else if (fpu.fpu_fcw.pc == MachO::x86_FP_PREC_64B)
8436 outs() << "FP_PREC_64B ";
8438 outs() << fpu.fpu_fcw.pc << " ";
8440 if (fpu.fpu_fcw.rc == MachO::x86_FP_RND_NEAR)
8441 outs() << "FP_RND_NEAR ";
8442 else if (fpu.fpu_fcw.rc == MachO::x86_FP_RND_DOWN)
8443 outs() << "FP_RND_DOWN ";
8444 else if (fpu.fpu_fcw.rc == MachO::x86_FP_RND_UP)
8445 outs() << "FP_RND_UP ";
8446 else if (fpu.fpu_fcw.rc == MachO::x86_FP_CHOP)
8447 outs() << "FP_CHOP ";
8449 outs() << "\t status: invalid " << fpu.fpu_fsw.invalid;
8450 outs() << " denorm " << fpu.fpu_fsw.denorm;
8451 outs() << " zdiv " << fpu.fpu_fsw.zdiv;
8452 outs() << " ovrfl " << fpu.fpu_fsw.ovrfl;
8453 outs() << " undfl " << fpu.fpu_fsw.undfl;
8454 outs() << " precis " << fpu.fpu_fsw.precis;
8455 outs() << " stkflt " << fpu.fpu_fsw.stkflt << "\n";
8456 outs() << "\t errsumm " << fpu.fpu_fsw.errsumm;
8457 outs() << " c0 " << fpu.fpu_fsw.c0;
8458 outs() << " c1 " << fpu.fpu_fsw.c1;
8459 outs() << " c2 " << fpu.fpu_fsw.c2;
8460 outs() << " tos " << fpu.fpu_fsw.tos;
8461 outs() << " c3 " << fpu.fpu_fsw.c3;
8462 outs() << " busy " << fpu.fpu_fsw.busy << "\n";
8463 outs() << "\t fpu_ftw " << format("0x%02" PRIx32, fpu.fpu_ftw);
8464 outs() << " fpu_rsrv1 " << format("0x%02" PRIx32, fpu.fpu_rsrv1);
8465 outs() << " fpu_fop " << format("0x%04" PRIx32, fpu.fpu_fop);
8466 outs() << " fpu_ip " << format("0x%08" PRIx32, fpu.fpu_ip) << "\n";
8467 outs() << "\t fpu_cs " << format("0x%04" PRIx32, fpu.fpu_cs);
8468 outs() << " fpu_rsrv2 " << format("0x%04" PRIx32, fpu.fpu_rsrv2);
8469 outs() << " fpu_dp " << format("0x%08" PRIx32, fpu.fpu_dp);
8470 outs() << " fpu_ds " << format("0x%04" PRIx32, fpu.fpu_ds) << "\n";
8471 outs() << "\t fpu_rsrv3 " << format("0x%04" PRIx32, fpu.fpu_rsrv3);
8472 outs() << " fpu_mxcsr " << format("0x%08" PRIx32, fpu.fpu_mxcsr);
8473 outs() << " fpu_mxcsrmask " << format("0x%08" PRIx32, fpu.fpu_mxcsrmask);
8475 outs() << "\t fpu_stmm0:\n";
8476 Print_mmst_reg(fpu.fpu_stmm0);
8477 outs() << "\t fpu_stmm1:\n";
8478 Print_mmst_reg(fpu.fpu_stmm1);
8479 outs() << "\t fpu_stmm2:\n";
8480 Print_mmst_reg(fpu.fpu_stmm2);
8481 outs() << "\t fpu_stmm3:\n";
8482 Print_mmst_reg(fpu.fpu_stmm3);
8483 outs() << "\t fpu_stmm4:\n";
8484 Print_mmst_reg(fpu.fpu_stmm4);
8485 outs() << "\t fpu_stmm5:\n";
8486 Print_mmst_reg(fpu.fpu_stmm5);
8487 outs() << "\t fpu_stmm6:\n";
8488 Print_mmst_reg(fpu.fpu_stmm6);
8489 outs() << "\t fpu_stmm7:\n";
8490 Print_mmst_reg(fpu.fpu_stmm7);
8491 outs() << "\t fpu_xmm0:\n";
8492 Print_xmm_reg(fpu.fpu_xmm0);
8493 outs() << "\t fpu_xmm1:\n";
8494 Print_xmm_reg(fpu.fpu_xmm1);
8495 outs() << "\t fpu_xmm2:\n";
8496 Print_xmm_reg(fpu.fpu_xmm2);
8497 outs() << "\t fpu_xmm3:\n";
8498 Print_xmm_reg(fpu.fpu_xmm3);
8499 outs() << "\t fpu_xmm4:\n";
8500 Print_xmm_reg(fpu.fpu_xmm4);
8501 outs() << "\t fpu_xmm5:\n";
8502 Print_xmm_reg(fpu.fpu_xmm5);
8503 outs() << "\t fpu_xmm6:\n";
8504 Print_xmm_reg(fpu.fpu_xmm6);
8505 outs() << "\t fpu_xmm7:\n";
8506 Print_xmm_reg(fpu.fpu_xmm7);
8507 outs() << "\t fpu_xmm8:\n";
8508 Print_xmm_reg(fpu.fpu_xmm8);
8509 outs() << "\t fpu_xmm9:\n";
8510 Print_xmm_reg(fpu.fpu_xmm9);
8511 outs() << "\t fpu_xmm10:\n";
8512 Print_xmm_reg(fpu.fpu_xmm10);
8513 outs() << "\t fpu_xmm11:\n";
8514 Print_xmm_reg(fpu.fpu_xmm11);
8515 outs() << "\t fpu_xmm12:\n";
8516 Print_xmm_reg(fpu.fpu_xmm12);
8517 outs() << "\t fpu_xmm13:\n";
8518 Print_xmm_reg(fpu.fpu_xmm13);
8519 outs() << "\t fpu_xmm14:\n";
8520 Print_xmm_reg(fpu.fpu_xmm14);
8521 outs() << "\t fpu_xmm15:\n";
8522 Print_xmm_reg(fpu.fpu_xmm15);
8523 outs() << "\t fpu_rsrv4:\n";
8524 for (uint32_t f = 0; f < 6; f++) {
8526 for (uint32_t g = 0; g < 16; g++)
8527 outs() << format("%02" PRIx32, fpu.fpu_rsrv4[f * g]) << " ";
8530 outs() << "\t fpu_reserved1 " << format("0x%08" PRIx32, fpu.fpu_reserved1);
8534 static void Print_x86_exception_state_t(MachO::x86_exception_state64_t &exc64) {
8535 outs() << "\t trapno " << format("0x%08" PRIx32, exc64.trapno);
8536 outs() << " err " << format("0x%08" PRIx32, exc64.err);
8537 outs() << " faultvaddr " << format("0x%016" PRIx64, exc64.faultvaddr) << "\n";
8540 static void Print_arm_thread_state32_t(MachO::arm_thread_state32_t &cpu32) {
8541 outs() << "\t r0 " << format("0x%08" PRIx32, cpu32.r[0]);
8542 outs() << " r1 " << format("0x%08" PRIx32, cpu32.r[1]);
8543 outs() << " r2 " << format("0x%08" PRIx32, cpu32.r[2]);
8544 outs() << " r3 " << format("0x%08" PRIx32, cpu32.r[3]) << "\n";
8545 outs() << "\t r4 " << format("0x%08" PRIx32, cpu32.r[4]);
8546 outs() << " r5 " << format("0x%08" PRIx32, cpu32.r[5]);
8547 outs() << " r6 " << format("0x%08" PRIx32, cpu32.r[6]);
8548 outs() << " r7 " << format("0x%08" PRIx32, cpu32.r[7]) << "\n";
8549 outs() << "\t r8 " << format("0x%08" PRIx32, cpu32.r[8]);
8550 outs() << " r9 " << format("0x%08" PRIx32, cpu32.r[9]);
8551 outs() << " r10 " << format("0x%08" PRIx32, cpu32.r[10]);
8552 outs() << " r11 " << format("0x%08" PRIx32, cpu32.r[11]) << "\n";
8553 outs() << "\t r12 " << format("0x%08" PRIx32, cpu32.r[12]);
8554 outs() << " sp " << format("0x%08" PRIx32, cpu32.sp);
8555 outs() << " lr " << format("0x%08" PRIx32, cpu32.lr);
8556 outs() << " pc " << format("0x%08" PRIx32, cpu32.pc) << "\n";
8557 outs() << "\t cpsr " << format("0x%08" PRIx32, cpu32.cpsr) << "\n";
8560 static void Print_arm_thread_state64_t(MachO::arm_thread_state64_t &cpu64) {
8561 outs() << "\t x0 " << format("0x%016" PRIx64, cpu64.x[0]);
8562 outs() << " x1 " << format("0x%016" PRIx64, cpu64.x[1]);
8563 outs() << " x2 " << format("0x%016" PRIx64, cpu64.x[2]) << "\n";
8564 outs() << "\t x3 " << format("0x%016" PRIx64, cpu64.x[3]);
8565 outs() << " x4 " << format("0x%016" PRIx64, cpu64.x[4]);
8566 outs() << " x5 " << format("0x%016" PRIx64, cpu64.x[5]) << "\n";
8567 outs() << "\t x6 " << format("0x%016" PRIx64, cpu64.x[6]);
8568 outs() << " x7 " << format("0x%016" PRIx64, cpu64.x[7]);
8569 outs() << " x8 " << format("0x%016" PRIx64, cpu64.x[8]) << "\n";
8570 outs() << "\t x9 " << format("0x%016" PRIx64, cpu64.x[9]);
8571 outs() << " x10 " << format("0x%016" PRIx64, cpu64.x[10]);
8572 outs() << " x11 " << format("0x%016" PRIx64, cpu64.x[11]) << "\n";
8573 outs() << "\t x12 " << format("0x%016" PRIx64, cpu64.x[12]);
8574 outs() << " x13 " << format("0x%016" PRIx64, cpu64.x[13]);
8575 outs() << " x14 " << format("0x%016" PRIx64, cpu64.x[14]) << "\n";
8576 outs() << "\t x15 " << format("0x%016" PRIx64, cpu64.x[15]);
8577 outs() << " x16 " << format("0x%016" PRIx64, cpu64.x[16]);
8578 outs() << " x17 " << format("0x%016" PRIx64, cpu64.x[17]) << "\n";
8579 outs() << "\t x18 " << format("0x%016" PRIx64, cpu64.x[18]);
8580 outs() << " x19 " << format("0x%016" PRIx64, cpu64.x[19]);
8581 outs() << " x20 " << format("0x%016" PRIx64, cpu64.x[20]) << "\n";
8582 outs() << "\t x21 " << format("0x%016" PRIx64, cpu64.x[21]);
8583 outs() << " x22 " << format("0x%016" PRIx64, cpu64.x[22]);
8584 outs() << " x23 " << format("0x%016" PRIx64, cpu64.x[23]) << "\n";
8585 outs() << "\t x24 " << format("0x%016" PRIx64, cpu64.x[24]);
8586 outs() << " x25 " << format("0x%016" PRIx64, cpu64.x[25]);
8587 outs() << " x26 " << format("0x%016" PRIx64, cpu64.x[26]) << "\n";
8588 outs() << "\t x27 " << format("0x%016" PRIx64, cpu64.x[27]);
8589 outs() << " x28 " << format("0x%016" PRIx64, cpu64.x[28]);
8590 outs() << " fp " << format("0x%016" PRIx64, cpu64.fp) << "\n";
8591 outs() << "\t lr " << format("0x%016" PRIx64, cpu64.lr);
8592 outs() << " sp " << format("0x%016" PRIx64, cpu64.sp);
8593 outs() << " pc " << format("0x%016" PRIx64, cpu64.pc) << "\n";
8594 outs() << "\t cpsr " << format("0x%08" PRIx32, cpu64.cpsr) << "\n";
8597 static void PrintThreadCommand(MachO::thread_command t, const char *Ptr,
8598 bool isLittleEndian, uint32_t cputype) {
8599 if (t.cmd == MachO::LC_THREAD)
8600 outs() << " cmd LC_THREAD\n";
8601 else if (t.cmd == MachO::LC_UNIXTHREAD)
8602 outs() << " cmd LC_UNIXTHREAD\n";
8604 outs() << " cmd " << t.cmd << " (unknown)\n";
8605 outs() << " cmdsize " << t.cmdsize;
8606 if (t.cmdsize < sizeof(struct MachO::thread_command) + 2 * sizeof(uint32_t))
8607 outs() << " Incorrect size\n";
8611 const char *begin = Ptr + sizeof(struct MachO::thread_command);
8612 const char *end = Ptr + t.cmdsize;
8613 uint32_t flavor, count, left;
8614 if (cputype == MachO::CPU_TYPE_X86_64) {
8615 while (begin < end) {
8616 if (end - begin > (ptrdiff_t)sizeof(uint32_t)) {
8617 memcpy((char *)&flavor, begin, sizeof(uint32_t));
8618 begin += sizeof(uint32_t);
8623 if (isLittleEndian != sys::IsLittleEndianHost)
8624 sys::swapByteOrder(flavor);
8625 if (end - begin > (ptrdiff_t)sizeof(uint32_t)) {
8626 memcpy((char *)&count, begin, sizeof(uint32_t));
8627 begin += sizeof(uint32_t);
8632 if (isLittleEndian != sys::IsLittleEndianHost)
8633 sys::swapByteOrder(count);
8634 if (flavor == MachO::x86_THREAD_STATE64) {
8635 outs() << " flavor x86_THREAD_STATE64\n";
8636 if (count == MachO::x86_THREAD_STATE64_COUNT)
8637 outs() << " count x86_THREAD_STATE64_COUNT\n";
8639 outs() << " count " << count
8640 << " (not x86_THREAD_STATE64_COUNT)\n";
8641 MachO::x86_thread_state64_t cpu64;
8643 if (left >= sizeof(MachO::x86_thread_state64_t)) {
8644 memcpy(&cpu64, begin, sizeof(MachO::x86_thread_state64_t));
8645 begin += sizeof(MachO::x86_thread_state64_t);
8647 memset(&cpu64, '\0', sizeof(MachO::x86_thread_state64_t));
8648 memcpy(&cpu64, begin, left);
8651 if (isLittleEndian != sys::IsLittleEndianHost)
8653 Print_x86_thread_state64_t(cpu64);
8654 } else if (flavor == MachO::x86_THREAD_STATE) {
8655 outs() << " flavor x86_THREAD_STATE\n";
8656 if (count == MachO::x86_THREAD_STATE_COUNT)
8657 outs() << " count x86_THREAD_STATE_COUNT\n";
8659 outs() << " count " << count
8660 << " (not x86_THREAD_STATE_COUNT)\n";
8661 struct MachO::x86_thread_state_t ts;
8663 if (left >= sizeof(MachO::x86_thread_state_t)) {
8664 memcpy(&ts, begin, sizeof(MachO::x86_thread_state_t));
8665 begin += sizeof(MachO::x86_thread_state_t);
8667 memset(&ts, '\0', sizeof(MachO::x86_thread_state_t));
8668 memcpy(&ts, begin, left);
8671 if (isLittleEndian != sys::IsLittleEndianHost)
8673 if (ts.tsh.flavor == MachO::x86_THREAD_STATE64) {
8674 outs() << "\t tsh.flavor x86_THREAD_STATE64 ";
8675 if (ts.tsh.count == MachO::x86_THREAD_STATE64_COUNT)
8676 outs() << "tsh.count x86_THREAD_STATE64_COUNT\n";
8678 outs() << "tsh.count " << ts.tsh.count
8679 << " (not x86_THREAD_STATE64_COUNT\n";
8680 Print_x86_thread_state64_t(ts.uts.ts64);
8682 outs() << "\t tsh.flavor " << ts.tsh.flavor << " tsh.count "
8683 << ts.tsh.count << "\n";
8685 } else if (flavor == MachO::x86_FLOAT_STATE) {
8686 outs() << " flavor x86_FLOAT_STATE\n";
8687 if (count == MachO::x86_FLOAT_STATE_COUNT)
8688 outs() << " count x86_FLOAT_STATE_COUNT\n";
8690 outs() << " count " << count << " (not x86_FLOAT_STATE_COUNT)\n";
8691 struct MachO::x86_float_state_t fs;
8693 if (left >= sizeof(MachO::x86_float_state_t)) {
8694 memcpy(&fs, begin, sizeof(MachO::x86_float_state_t));
8695 begin += sizeof(MachO::x86_float_state_t);
8697 memset(&fs, '\0', sizeof(MachO::x86_float_state_t));
8698 memcpy(&fs, begin, left);
8701 if (isLittleEndian != sys::IsLittleEndianHost)
8703 if (fs.fsh.flavor == MachO::x86_FLOAT_STATE64) {
8704 outs() << "\t fsh.flavor x86_FLOAT_STATE64 ";
8705 if (fs.fsh.count == MachO::x86_FLOAT_STATE64_COUNT)
8706 outs() << "fsh.count x86_FLOAT_STATE64_COUNT\n";
8708 outs() << "fsh.count " << fs.fsh.count
8709 << " (not x86_FLOAT_STATE64_COUNT\n";
8710 Print_x86_float_state_t(fs.ufs.fs64);
8712 outs() << "\t fsh.flavor " << fs.fsh.flavor << " fsh.count "
8713 << fs.fsh.count << "\n";
8715 } else if (flavor == MachO::x86_EXCEPTION_STATE) {
8716 outs() << " flavor x86_EXCEPTION_STATE\n";
8717 if (count == MachO::x86_EXCEPTION_STATE_COUNT)
8718 outs() << " count x86_EXCEPTION_STATE_COUNT\n";
8720 outs() << " count " << count
8721 << " (not x86_EXCEPTION_STATE_COUNT)\n";
8722 struct MachO::x86_exception_state_t es;
8724 if (left >= sizeof(MachO::x86_exception_state_t)) {
8725 memcpy(&es, begin, sizeof(MachO::x86_exception_state_t));
8726 begin += sizeof(MachO::x86_exception_state_t);
8728 memset(&es, '\0', sizeof(MachO::x86_exception_state_t));
8729 memcpy(&es, begin, left);
8732 if (isLittleEndian != sys::IsLittleEndianHost)
8734 if (es.esh.flavor == MachO::x86_EXCEPTION_STATE64) {
8735 outs() << "\t esh.flavor x86_EXCEPTION_STATE64\n";
8736 if (es.esh.count == MachO::x86_EXCEPTION_STATE64_COUNT)
8737 outs() << "\t esh.count x86_EXCEPTION_STATE64_COUNT\n";
8739 outs() << "\t esh.count " << es.esh.count
8740 << " (not x86_EXCEPTION_STATE64_COUNT\n";
8741 Print_x86_exception_state_t(es.ues.es64);
8743 outs() << "\t esh.flavor " << es.esh.flavor << " esh.count "
8744 << es.esh.count << "\n";
8747 outs() << " flavor " << flavor << " (unknown)\n";
8748 outs() << " count " << count << "\n";
8749 outs() << " state (unknown)\n";
8750 begin += count * sizeof(uint32_t);
8753 } else if (cputype == MachO::CPU_TYPE_ARM) {
8754 while (begin < end) {
8755 if (end - begin > (ptrdiff_t)sizeof(uint32_t)) {
8756 memcpy((char *)&flavor, begin, sizeof(uint32_t));
8757 begin += sizeof(uint32_t);
8762 if (isLittleEndian != sys::IsLittleEndianHost)
8763 sys::swapByteOrder(flavor);
8764 if (end - begin > (ptrdiff_t)sizeof(uint32_t)) {
8765 memcpy((char *)&count, begin, sizeof(uint32_t));
8766 begin += sizeof(uint32_t);
8771 if (isLittleEndian != sys::IsLittleEndianHost)
8772 sys::swapByteOrder(count);
8773 if (flavor == MachO::ARM_THREAD_STATE) {
8774 outs() << " flavor ARM_THREAD_STATE\n";
8775 if (count == MachO::ARM_THREAD_STATE_COUNT)
8776 outs() << " count ARM_THREAD_STATE_COUNT\n";
8778 outs() << " count " << count
8779 << " (not ARM_THREAD_STATE_COUNT)\n";
8780 MachO::arm_thread_state32_t cpu32;
8782 if (left >= sizeof(MachO::arm_thread_state32_t)) {
8783 memcpy(&cpu32, begin, sizeof(MachO::arm_thread_state32_t));
8784 begin += sizeof(MachO::arm_thread_state32_t);
8786 memset(&cpu32, '\0', sizeof(MachO::arm_thread_state32_t));
8787 memcpy(&cpu32, begin, left);
8790 if (isLittleEndian != sys::IsLittleEndianHost)
8792 Print_arm_thread_state32_t(cpu32);
8794 outs() << " flavor " << flavor << " (unknown)\n";
8795 outs() << " count " << count << "\n";
8796 outs() << " state (unknown)\n";
8797 begin += count * sizeof(uint32_t);
8800 } else if (cputype == MachO::CPU_TYPE_ARM64) {
8801 while (begin < end) {
8802 if (end - begin > (ptrdiff_t)sizeof(uint32_t)) {
8803 memcpy((char *)&flavor, begin, sizeof(uint32_t));
8804 begin += sizeof(uint32_t);
8809 if (isLittleEndian != sys::IsLittleEndianHost)
8810 sys::swapByteOrder(flavor);
8811 if (end - begin > (ptrdiff_t)sizeof(uint32_t)) {
8812 memcpy((char *)&count, begin, sizeof(uint32_t));
8813 begin += sizeof(uint32_t);
8818 if (isLittleEndian != sys::IsLittleEndianHost)
8819 sys::swapByteOrder(count);
8820 if (flavor == MachO::ARM_THREAD_STATE64) {
8821 outs() << " flavor ARM_THREAD_STATE64\n";
8822 if (count == MachO::ARM_THREAD_STATE64_COUNT)
8823 outs() << " count ARM_THREAD_STATE64_COUNT\n";
8825 outs() << " count " << count
8826 << " (not ARM_THREAD_STATE64_COUNT)\n";
8827 MachO::arm_thread_state64_t cpu64;
8829 if (left >= sizeof(MachO::arm_thread_state64_t)) {
8830 memcpy(&cpu64, begin, sizeof(MachO::arm_thread_state64_t));
8831 begin += sizeof(MachO::arm_thread_state64_t);
8833 memset(&cpu64, '\0', sizeof(MachO::arm_thread_state64_t));
8834 memcpy(&cpu64, begin, left);
8837 if (isLittleEndian != sys::IsLittleEndianHost)
8839 Print_arm_thread_state64_t(cpu64);
8841 outs() << " flavor " << flavor << " (unknown)\n";
8842 outs() << " count " << count << "\n";
8843 outs() << " state (unknown)\n";
8844 begin += count * sizeof(uint32_t);
8848 while (begin < end) {
8849 if (end - begin > (ptrdiff_t)sizeof(uint32_t)) {
8850 memcpy((char *)&flavor, begin, sizeof(uint32_t));
8851 begin += sizeof(uint32_t);
8856 if (isLittleEndian != sys::IsLittleEndianHost)
8857 sys::swapByteOrder(flavor);
8858 if (end - begin > (ptrdiff_t)sizeof(uint32_t)) {
8859 memcpy((char *)&count, begin, sizeof(uint32_t));
8860 begin += sizeof(uint32_t);
8865 if (isLittleEndian != sys::IsLittleEndianHost)
8866 sys::swapByteOrder(count);
8867 outs() << " flavor " << flavor << "\n";
8868 outs() << " count " << count << "\n";
8869 outs() << " state (Unknown cputype/cpusubtype)\n";
8870 begin += count * sizeof(uint32_t);
8875 static void PrintDylibCommand(MachO::dylib_command dl, const char *Ptr) {
8876 if (dl.cmd == MachO::LC_ID_DYLIB)
8877 outs() << " cmd LC_ID_DYLIB\n";
8878 else if (dl.cmd == MachO::LC_LOAD_DYLIB)
8879 outs() << " cmd LC_LOAD_DYLIB\n";
8880 else if (dl.cmd == MachO::LC_LOAD_WEAK_DYLIB)
8881 outs() << " cmd LC_LOAD_WEAK_DYLIB\n";
8882 else if (dl.cmd == MachO::LC_REEXPORT_DYLIB)
8883 outs() << " cmd LC_REEXPORT_DYLIB\n";
8884 else if (dl.cmd == MachO::LC_LAZY_LOAD_DYLIB)
8885 outs() << " cmd LC_LAZY_LOAD_DYLIB\n";
8886 else if (dl.cmd == MachO::LC_LOAD_UPWARD_DYLIB)
8887 outs() << " cmd LC_LOAD_UPWARD_DYLIB\n";
8889 outs() << " cmd " << dl.cmd << " (unknown)\n";
8890 outs() << " cmdsize " << dl.cmdsize;
8891 if (dl.cmdsize < sizeof(struct MachO::dylib_command))
8892 outs() << " Incorrect size\n";
8895 if (dl.dylib.name < dl.cmdsize) {
8896 const char *P = (const char *)(Ptr) + dl.dylib.name;
8897 outs() << " name " << P << " (offset " << dl.dylib.name << ")\n";
8899 outs() << " name ?(bad offset " << dl.dylib.name << ")\n";
8901 outs() << " time stamp " << dl.dylib.timestamp << " ";
8902 time_t t = dl.dylib.timestamp;
8903 outs() << ctime(&t);
8904 outs() << " current version ";
8905 if (dl.dylib.current_version == 0xffffffff)
8908 outs() << ((dl.dylib.current_version >> 16) & 0xffff) << "."
8909 << ((dl.dylib.current_version >> 8) & 0xff) << "."
8910 << (dl.dylib.current_version & 0xff) << "\n";
8911 outs() << "compatibility version ";
8912 if (dl.dylib.compatibility_version == 0xffffffff)
8915 outs() << ((dl.dylib.compatibility_version >> 16) & 0xffff) << "."
8916 << ((dl.dylib.compatibility_version >> 8) & 0xff) << "."
8917 << (dl.dylib.compatibility_version & 0xff) << "\n";
8920 static void PrintLinkEditDataCommand(MachO::linkedit_data_command ld,
8921 uint32_t object_size) {
8922 if (ld.cmd == MachO::LC_CODE_SIGNATURE)
8923 outs() << " cmd LC_CODE_SIGNATURE\n";
8924 else if (ld.cmd == MachO::LC_SEGMENT_SPLIT_INFO)
8925 outs() << " cmd LC_SEGMENT_SPLIT_INFO\n";
8926 else if (ld.cmd == MachO::LC_FUNCTION_STARTS)
8927 outs() << " cmd LC_FUNCTION_STARTS\n";
8928 else if (ld.cmd == MachO::LC_DATA_IN_CODE)
8929 outs() << " cmd LC_DATA_IN_CODE\n";
8930 else if (ld.cmd == MachO::LC_DYLIB_CODE_SIGN_DRS)
8931 outs() << " cmd LC_DYLIB_CODE_SIGN_DRS\n";
8932 else if (ld.cmd == MachO::LC_LINKER_OPTIMIZATION_HINT)
8933 outs() << " cmd LC_LINKER_OPTIMIZATION_HINT\n";
8935 outs() << " cmd " << ld.cmd << " (?)\n";
8936 outs() << " cmdsize " << ld.cmdsize;
8937 if (ld.cmdsize != sizeof(struct MachO::linkedit_data_command))
8938 outs() << " Incorrect size\n";
8941 outs() << " dataoff " << ld.dataoff;
8942 if (ld.dataoff > object_size)
8943 outs() << " (past end of file)\n";
8946 outs() << " datasize " << ld.datasize;
8947 uint64_t big_size = ld.dataoff;
8948 big_size += ld.datasize;
8949 if (big_size > object_size)
8950 outs() << " (past end of file)\n";
8955 static void PrintLoadCommands(const MachOObjectFile *Obj, uint32_t filetype,
8956 uint32_t cputype, bool verbose) {
8957 StringRef Buf = Obj->getData();
8959 for (const auto &Command : Obj->load_commands()) {
8960 outs() << "Load command " << Index++ << "\n";
8961 if (Command.C.cmd == MachO::LC_SEGMENT) {
8962 MachO::segment_command SLC = Obj->getSegmentLoadCommand(Command);
8963 const char *sg_segname = SLC.segname;
8964 PrintSegmentCommand(SLC.cmd, SLC.cmdsize, SLC.segname, SLC.vmaddr,
8965 SLC.vmsize, SLC.fileoff, SLC.filesize, SLC.maxprot,
8966 SLC.initprot, SLC.nsects, SLC.flags, Buf.size(),
8968 for (unsigned j = 0; j < SLC.nsects; j++) {
8969 MachO::section S = Obj->getSection(Command, j);
8970 PrintSection(S.sectname, S.segname, S.addr, S.size, S.offset, S.align,
8971 S.reloff, S.nreloc, S.flags, S.reserved1, S.reserved2,
8972 SLC.cmd, sg_segname, filetype, Buf.size(), verbose);
8974 } else if (Command.C.cmd == MachO::LC_SEGMENT_64) {
8975 MachO::segment_command_64 SLC_64 = Obj->getSegment64LoadCommand(Command);
8976 const char *sg_segname = SLC_64.segname;
8977 PrintSegmentCommand(SLC_64.cmd, SLC_64.cmdsize, SLC_64.segname,
8978 SLC_64.vmaddr, SLC_64.vmsize, SLC_64.fileoff,
8979 SLC_64.filesize, SLC_64.maxprot, SLC_64.initprot,
8980 SLC_64.nsects, SLC_64.flags, Buf.size(), verbose);
8981 for (unsigned j = 0; j < SLC_64.nsects; j++) {
8982 MachO::section_64 S_64 = Obj->getSection64(Command, j);
8983 PrintSection(S_64.sectname, S_64.segname, S_64.addr, S_64.size,
8984 S_64.offset, S_64.align, S_64.reloff, S_64.nreloc,
8985 S_64.flags, S_64.reserved1, S_64.reserved2, SLC_64.cmd,
8986 sg_segname, filetype, Buf.size(), verbose);
8988 } else if (Command.C.cmd == MachO::LC_SYMTAB) {
8989 MachO::symtab_command Symtab = Obj->getSymtabLoadCommand();
8990 PrintSymtabLoadCommand(Symtab, Obj->is64Bit(), Buf.size());
8991 } else if (Command.C.cmd == MachO::LC_DYSYMTAB) {
8992 MachO::dysymtab_command Dysymtab = Obj->getDysymtabLoadCommand();
8993 MachO::symtab_command Symtab = Obj->getSymtabLoadCommand();
8994 PrintDysymtabLoadCommand(Dysymtab, Symtab.nsyms, Buf.size(),
8996 } else if (Command.C.cmd == MachO::LC_DYLD_INFO ||
8997 Command.C.cmd == MachO::LC_DYLD_INFO_ONLY) {
8998 MachO::dyld_info_command DyldInfo = Obj->getDyldInfoLoadCommand(Command);
8999 PrintDyldInfoLoadCommand(DyldInfo, Buf.size());
9000 } else if (Command.C.cmd == MachO::LC_LOAD_DYLINKER ||
9001 Command.C.cmd == MachO::LC_ID_DYLINKER ||
9002 Command.C.cmd == MachO::LC_DYLD_ENVIRONMENT) {
9003 MachO::dylinker_command Dyld = Obj->getDylinkerCommand(Command);
9004 PrintDyldLoadCommand(Dyld, Command.Ptr);
9005 } else if (Command.C.cmd == MachO::LC_UUID) {
9006 MachO::uuid_command Uuid = Obj->getUuidCommand(Command);
9007 PrintUuidLoadCommand(Uuid);
9008 } else if (Command.C.cmd == MachO::LC_RPATH) {
9009 MachO::rpath_command Rpath = Obj->getRpathCommand(Command);
9010 PrintRpathLoadCommand(Rpath, Command.Ptr);
9011 } else if (Command.C.cmd == MachO::LC_VERSION_MIN_MACOSX ||
9012 Command.C.cmd == MachO::LC_VERSION_MIN_IPHONEOS ||
9013 Command.C.cmd == MachO::LC_VERSION_MIN_TVOS ||
9014 Command.C.cmd == MachO::LC_VERSION_MIN_WATCHOS) {
9015 MachO::version_min_command Vd = Obj->getVersionMinLoadCommand(Command);
9016 PrintVersionMinLoadCommand(Vd);
9017 } else if (Command.C.cmd == MachO::LC_SOURCE_VERSION) {
9018 MachO::source_version_command Sd = Obj->getSourceVersionCommand(Command);
9019 PrintSourceVersionCommand(Sd);
9020 } else if (Command.C.cmd == MachO::LC_MAIN) {
9021 MachO::entry_point_command Ep = Obj->getEntryPointCommand(Command);
9022 PrintEntryPointCommand(Ep);
9023 } else if (Command.C.cmd == MachO::LC_ENCRYPTION_INFO) {
9024 MachO::encryption_info_command Ei =
9025 Obj->getEncryptionInfoCommand(Command);
9026 PrintEncryptionInfoCommand(Ei, Buf.size());
9027 } else if (Command.C.cmd == MachO::LC_ENCRYPTION_INFO_64) {
9028 MachO::encryption_info_command_64 Ei =
9029 Obj->getEncryptionInfoCommand64(Command);
9030 PrintEncryptionInfoCommand64(Ei, Buf.size());
9031 } else if (Command.C.cmd == MachO::LC_LINKER_OPTION) {
9032 MachO::linker_option_command Lo =
9033 Obj->getLinkerOptionLoadCommand(Command);
9034 PrintLinkerOptionCommand(Lo, Command.Ptr);
9035 } else if (Command.C.cmd == MachO::LC_SUB_FRAMEWORK) {
9036 MachO::sub_framework_command Sf = Obj->getSubFrameworkCommand(Command);
9037 PrintSubFrameworkCommand(Sf, Command.Ptr);
9038 } else if (Command.C.cmd == MachO::LC_SUB_UMBRELLA) {
9039 MachO::sub_umbrella_command Sf = Obj->getSubUmbrellaCommand(Command);
9040 PrintSubUmbrellaCommand(Sf, Command.Ptr);
9041 } else if (Command.C.cmd == MachO::LC_SUB_LIBRARY) {
9042 MachO::sub_library_command Sl = Obj->getSubLibraryCommand(Command);
9043 PrintSubLibraryCommand(Sl, Command.Ptr);
9044 } else if (Command.C.cmd == MachO::LC_SUB_CLIENT) {
9045 MachO::sub_client_command Sc = Obj->getSubClientCommand(Command);
9046 PrintSubClientCommand(Sc, Command.Ptr);
9047 } else if (Command.C.cmd == MachO::LC_ROUTINES) {
9048 MachO::routines_command Rc = Obj->getRoutinesCommand(Command);
9049 PrintRoutinesCommand(Rc);
9050 } else if (Command.C.cmd == MachO::LC_ROUTINES_64) {
9051 MachO::routines_command_64 Rc = Obj->getRoutinesCommand64(Command);
9052 PrintRoutinesCommand64(Rc);
9053 } else if (Command.C.cmd == MachO::LC_THREAD ||
9054 Command.C.cmd == MachO::LC_UNIXTHREAD) {
9055 MachO::thread_command Tc = Obj->getThreadCommand(Command);
9056 PrintThreadCommand(Tc, Command.Ptr, Obj->isLittleEndian(), cputype);
9057 } else if (Command.C.cmd == MachO::LC_LOAD_DYLIB ||
9058 Command.C.cmd == MachO::LC_ID_DYLIB ||
9059 Command.C.cmd == MachO::LC_LOAD_WEAK_DYLIB ||
9060 Command.C.cmd == MachO::LC_REEXPORT_DYLIB ||
9061 Command.C.cmd == MachO::LC_LAZY_LOAD_DYLIB ||
9062 Command.C.cmd == MachO::LC_LOAD_UPWARD_DYLIB) {
9063 MachO::dylib_command Dl = Obj->getDylibIDLoadCommand(Command);
9064 PrintDylibCommand(Dl, Command.Ptr);
9065 } else if (Command.C.cmd == MachO::LC_CODE_SIGNATURE ||
9066 Command.C.cmd == MachO::LC_SEGMENT_SPLIT_INFO ||
9067 Command.C.cmd == MachO::LC_FUNCTION_STARTS ||
9068 Command.C.cmd == MachO::LC_DATA_IN_CODE ||
9069 Command.C.cmd == MachO::LC_DYLIB_CODE_SIGN_DRS ||
9070 Command.C.cmd == MachO::LC_LINKER_OPTIMIZATION_HINT) {
9071 MachO::linkedit_data_command Ld =
9072 Obj->getLinkeditDataLoadCommand(Command);
9073 PrintLinkEditDataCommand(Ld, Buf.size());
9075 outs() << " cmd ?(" << format("0x%08" PRIx32, Command.C.cmd)
9077 outs() << " cmdsize " << Command.C.cmdsize << "\n";
9078 // TODO: get and print the raw bytes of the load command.
9080 // TODO: print all the other kinds of load commands.
9084 static void PrintMachHeader(const MachOObjectFile *Obj, bool verbose) {
9085 if (Obj->is64Bit()) {
9086 MachO::mach_header_64 H_64;
9087 H_64 = Obj->getHeader64();
9088 PrintMachHeader(H_64.magic, H_64.cputype, H_64.cpusubtype, H_64.filetype,
9089 H_64.ncmds, H_64.sizeofcmds, H_64.flags, verbose);
9091 MachO::mach_header H;
9092 H = Obj->getHeader();
9093 PrintMachHeader(H.magic, H.cputype, H.cpusubtype, H.filetype, H.ncmds,
9094 H.sizeofcmds, H.flags, verbose);
9098 void llvm::printMachOFileHeader(const object::ObjectFile *Obj) {
9099 const MachOObjectFile *file = dyn_cast<const MachOObjectFile>(Obj);
9100 PrintMachHeader(file, !NonVerbose);
9103 void llvm::printMachOLoadCommands(const object::ObjectFile *Obj) {
9104 const MachOObjectFile *file = dyn_cast<const MachOObjectFile>(Obj);
9105 uint32_t filetype = 0;
9106 uint32_t cputype = 0;
9107 if (file->is64Bit()) {
9108 MachO::mach_header_64 H_64;
9109 H_64 = file->getHeader64();
9110 filetype = H_64.filetype;
9111 cputype = H_64.cputype;
9113 MachO::mach_header H;
9114 H = file->getHeader();
9115 filetype = H.filetype;
9116 cputype = H.cputype;
9118 PrintLoadCommands(file, filetype, cputype, !NonVerbose);
9121 //===----------------------------------------------------------------------===//
9122 // export trie dumping
9123 //===----------------------------------------------------------------------===//
9125 void llvm::printMachOExportsTrie(const object::MachOObjectFile *Obj) {
9126 for (const llvm::object::ExportEntry &Entry : Obj->exports()) {
9127 uint64_t Flags = Entry.flags();
9128 bool ReExport = (Flags & MachO::EXPORT_SYMBOL_FLAGS_REEXPORT);
9129 bool WeakDef = (Flags & MachO::EXPORT_SYMBOL_FLAGS_WEAK_DEFINITION);
9130 bool ThreadLocal = ((Flags & MachO::EXPORT_SYMBOL_FLAGS_KIND_MASK) ==
9131 MachO::EXPORT_SYMBOL_FLAGS_KIND_THREAD_LOCAL);
9132 bool Abs = ((Flags & MachO::EXPORT_SYMBOL_FLAGS_KIND_MASK) ==
9133 MachO::EXPORT_SYMBOL_FLAGS_KIND_ABSOLUTE);
9134 bool Resolver = (Flags & MachO::EXPORT_SYMBOL_FLAGS_STUB_AND_RESOLVER);
9136 outs() << "[re-export] ";
9138 outs() << format("0x%08llX ",
9139 Entry.address()); // FIXME:add in base address
9140 outs() << Entry.name();
9141 if (WeakDef || ThreadLocal || Resolver || Abs) {
9142 bool NeedsComma = false;
9145 outs() << "weak_def";
9151 outs() << "per-thread";
9157 outs() << "absolute";
9163 outs() << format("resolver=0x%08llX", Entry.other());
9169 StringRef DylibName = "unknown";
9170 int Ordinal = Entry.other() - 1;
9171 Obj->getLibraryShortNameByIndex(Ordinal, DylibName);
9172 if (Entry.otherName().empty())
9173 outs() << " (from " << DylibName << ")";
9175 outs() << " (" << Entry.otherName() << " from " << DylibName << ")";
9181 //===----------------------------------------------------------------------===//
9182 // rebase table dumping
9183 //===----------------------------------------------------------------------===//
9188 SegInfo(const object::MachOObjectFile *Obj);
9190 StringRef segmentName(uint32_t SegIndex);
9191 StringRef sectionName(uint32_t SegIndex, uint64_t SegOffset);
9192 uint64_t address(uint32_t SegIndex, uint64_t SegOffset);
9193 bool isValidSegIndexAndOffset(uint32_t SegIndex, uint64_t SegOffset);
9196 struct SectionInfo {
9199 StringRef SectionName;
9200 StringRef SegmentName;
9201 uint64_t OffsetInSegment;
9202 uint64_t SegmentStartAddress;
9203 uint32_t SegmentIndex;
9205 const SectionInfo &findSection(uint32_t SegIndex, uint64_t SegOffset);
9206 SmallVector<SectionInfo, 32> Sections;
9210 SegInfo::SegInfo(const object::MachOObjectFile *Obj) {
9211 // Build table of sections so segIndex/offset pairs can be translated.
9212 uint32_t CurSegIndex = Obj->hasPageZeroSegment() ? 1 : 0;
9213 StringRef CurSegName;
9214 uint64_t CurSegAddress;
9215 for (const SectionRef &Section : Obj->sections()) {
9217 error(Section.getName(Info.SectionName));
9218 Info.Address = Section.getAddress();
9219 Info.Size = Section.getSize();
9221 Obj->getSectionFinalSegmentName(Section.getRawDataRefImpl());
9222 if (!Info.SegmentName.equals(CurSegName)) {
9224 CurSegName = Info.SegmentName;
9225 CurSegAddress = Info.Address;
9227 Info.SegmentIndex = CurSegIndex - 1;
9228 Info.OffsetInSegment = Info.Address - CurSegAddress;
9229 Info.SegmentStartAddress = CurSegAddress;
9230 Sections.push_back(Info);
9234 StringRef SegInfo::segmentName(uint32_t SegIndex) {
9235 for (const SectionInfo &SI : Sections) {
9236 if (SI.SegmentIndex == SegIndex)
9237 return SI.SegmentName;
9239 llvm_unreachable("invalid segIndex");
9242 bool SegInfo::isValidSegIndexAndOffset(uint32_t SegIndex,
9243 uint64_t OffsetInSeg) {
9244 for (const SectionInfo &SI : Sections) {
9245 if (SI.SegmentIndex != SegIndex)
9247 if (SI.OffsetInSegment > OffsetInSeg)
9249 if (OffsetInSeg >= (SI.OffsetInSegment + SI.Size))
9256 const SegInfo::SectionInfo &SegInfo::findSection(uint32_t SegIndex,
9257 uint64_t OffsetInSeg) {
9258 for (const SectionInfo &SI : Sections) {
9259 if (SI.SegmentIndex != SegIndex)
9261 if (SI.OffsetInSegment > OffsetInSeg)
9263 if (OffsetInSeg >= (SI.OffsetInSegment + SI.Size))
9267 llvm_unreachable("segIndex and offset not in any section");
9270 StringRef SegInfo::sectionName(uint32_t SegIndex, uint64_t OffsetInSeg) {
9271 return findSection(SegIndex, OffsetInSeg).SectionName;
9274 uint64_t SegInfo::address(uint32_t SegIndex, uint64_t OffsetInSeg) {
9275 const SectionInfo &SI = findSection(SegIndex, OffsetInSeg);
9276 return SI.SegmentStartAddress + OffsetInSeg;
9279 void llvm::printMachORebaseTable(const object::MachOObjectFile *Obj) {
9280 // Build table of sections so names can used in final output.
9281 SegInfo sectionTable(Obj);
9283 outs() << "segment section address type\n";
9284 for (const llvm::object::MachORebaseEntry &Entry : Obj->rebaseTable()) {
9285 uint32_t SegIndex = Entry.segmentIndex();
9286 uint64_t OffsetInSeg = Entry.segmentOffset();
9287 StringRef SegmentName = sectionTable.segmentName(SegIndex);
9288 StringRef SectionName = sectionTable.sectionName(SegIndex, OffsetInSeg);
9289 uint64_t Address = sectionTable.address(SegIndex, OffsetInSeg);
9291 // Table lines look like: __DATA __nl_symbol_ptr 0x0000F00C pointer
9292 outs() << format("%-8s %-18s 0x%08" PRIX64 " %s\n",
9293 SegmentName.str().c_str(), SectionName.str().c_str(),
9294 Address, Entry.typeName().str().c_str());
9298 static StringRef ordinalName(const object::MachOObjectFile *Obj, int Ordinal) {
9299 StringRef DylibName;
9301 case MachO::BIND_SPECIAL_DYLIB_SELF:
9302 return "this-image";
9303 case MachO::BIND_SPECIAL_DYLIB_MAIN_EXECUTABLE:
9304 return "main-executable";
9305 case MachO::BIND_SPECIAL_DYLIB_FLAT_LOOKUP:
9306 return "flat-namespace";
9309 std::error_code EC =
9310 Obj->getLibraryShortNameByIndex(Ordinal - 1, DylibName);
9312 return "<<bad library ordinal>>";
9316 return "<<unknown special ordinal>>";
9319 //===----------------------------------------------------------------------===//
9320 // bind table dumping
9321 //===----------------------------------------------------------------------===//
9323 void llvm::printMachOBindTable(const object::MachOObjectFile *Obj) {
9324 // Build table of sections so names can used in final output.
9325 SegInfo sectionTable(Obj);
9327 outs() << "segment section address type "
9328 "addend dylib symbol\n";
9329 for (const llvm::object::MachOBindEntry &Entry : Obj->bindTable()) {
9330 uint32_t SegIndex = Entry.segmentIndex();
9331 uint64_t OffsetInSeg = Entry.segmentOffset();
9332 StringRef SegmentName = sectionTable.segmentName(SegIndex);
9333 StringRef SectionName = sectionTable.sectionName(SegIndex, OffsetInSeg);
9334 uint64_t Address = sectionTable.address(SegIndex, OffsetInSeg);
9336 // Table lines look like:
9337 // __DATA __got 0x00012010 pointer 0 libSystem ___stack_chk_guard
9339 if (Entry.flags() & MachO::BIND_SYMBOL_FLAGS_WEAK_IMPORT)
9340 Attr = " (weak_import)";
9341 outs() << left_justify(SegmentName, 8) << " "
9342 << left_justify(SectionName, 18) << " "
9343 << format_hex(Address, 10, true) << " "
9344 << left_justify(Entry.typeName(), 8) << " "
9345 << format_decimal(Entry.addend(), 8) << " "
9346 << left_justify(ordinalName(Obj, Entry.ordinal()), 16) << " "
9347 << Entry.symbolName() << Attr << "\n";
9351 //===----------------------------------------------------------------------===//
9352 // lazy bind table dumping
9353 //===----------------------------------------------------------------------===//
9355 void llvm::printMachOLazyBindTable(const object::MachOObjectFile *Obj) {
9356 // Build table of sections so names can used in final output.
9357 SegInfo sectionTable(Obj);
9359 outs() << "segment section address "
9361 for (const llvm::object::MachOBindEntry &Entry : Obj->lazyBindTable()) {
9362 uint32_t SegIndex = Entry.segmentIndex();
9363 uint64_t OffsetInSeg = Entry.segmentOffset();
9364 StringRef SegmentName = sectionTable.segmentName(SegIndex);
9365 StringRef SectionName = sectionTable.sectionName(SegIndex, OffsetInSeg);
9366 uint64_t Address = sectionTable.address(SegIndex, OffsetInSeg);
9368 // Table lines look like:
9369 // __DATA __got 0x00012010 libSystem ___stack_chk_guard
9370 outs() << left_justify(SegmentName, 8) << " "
9371 << left_justify(SectionName, 18) << " "
9372 << format_hex(Address, 10, true) << " "
9373 << left_justify(ordinalName(Obj, Entry.ordinal()), 16) << " "
9374 << Entry.symbolName() << "\n";
9378 //===----------------------------------------------------------------------===//
9379 // weak bind table dumping
9380 //===----------------------------------------------------------------------===//
9382 void llvm::printMachOWeakBindTable(const object::MachOObjectFile *Obj) {
9383 // Build table of sections so names can used in final output.
9384 SegInfo sectionTable(Obj);
9386 outs() << "segment section address "
9387 "type addend symbol\n";
9388 for (const llvm::object::MachOBindEntry &Entry : Obj->weakBindTable()) {
9389 // Strong symbols don't have a location to update.
9390 if (Entry.flags() & MachO::BIND_SYMBOL_FLAGS_NON_WEAK_DEFINITION) {
9391 outs() << " strong "
9392 << Entry.symbolName() << "\n";
9395 uint32_t SegIndex = Entry.segmentIndex();
9396 uint64_t OffsetInSeg = Entry.segmentOffset();
9397 StringRef SegmentName = sectionTable.segmentName(SegIndex);
9398 StringRef SectionName = sectionTable.sectionName(SegIndex, OffsetInSeg);
9399 uint64_t Address = sectionTable.address(SegIndex, OffsetInSeg);
9401 // Table lines look like:
9402 // __DATA __data 0x00001000 pointer 0 _foo
9403 outs() << left_justify(SegmentName, 8) << " "
9404 << left_justify(SectionName, 18) << " "
9405 << format_hex(Address, 10, true) << " "
9406 << left_justify(Entry.typeName(), 8) << " "
9407 << format_decimal(Entry.addend(), 8) << " " << Entry.symbolName()
9412 // get_dyld_bind_info_symbolname() is used for disassembly and passed an
9413 // address, ReferenceValue, in the Mach-O file and looks in the dyld bind
9414 // information for that address. If the address is found its binding symbol
9415 // name is returned. If not nullptr is returned.
9416 static const char *get_dyld_bind_info_symbolname(uint64_t ReferenceValue,
9417 struct DisassembleInfo *info) {
9418 if (info->bindtable == nullptr) {
9419 info->bindtable = llvm::make_unique<SymbolAddressMap>();
9420 SegInfo sectionTable(info->O);
9421 for (const llvm::object::MachOBindEntry &Entry : info->O->bindTable()) {
9422 uint32_t SegIndex = Entry.segmentIndex();
9423 uint64_t OffsetInSeg = Entry.segmentOffset();
9424 if (!sectionTable.isValidSegIndexAndOffset(SegIndex, OffsetInSeg))
9426 uint64_t Address = sectionTable.address(SegIndex, OffsetInSeg);
9427 StringRef name = Entry.symbolName();
9429 (*info->bindtable)[Address] = name;
9432 auto name = info->bindtable->lookup(ReferenceValue);
9433 return !name.empty() ? name.data() : nullptr;