1 //===- DWARFContext.cpp ---------------------------------------------------===//
3 // The LLVM Compiler Infrastructure
5 // This file is distributed under the University of Illinois Open Source
6 // License. See LICENSE.TXT for details.
8 //===----------------------------------------------------------------------===//
10 #include "llvm/DebugInfo/DWARF/DWARFContext.h"
11 #include "llvm/ADT/STLExtras.h"
12 #include "llvm/ADT/SmallString.h"
13 #include "llvm/ADT/SmallVector.h"
14 #include "llvm/ADT/StringRef.h"
15 #include "llvm/ADT/StringSwitch.h"
16 #include "llvm/DebugInfo/DWARF/DWARFAcceleratorTable.h"
17 #include "llvm/DebugInfo/DWARF/DWARFCompileUnit.h"
18 #include "llvm/DebugInfo/DWARF/DWARFDebugAbbrev.h"
19 #include "llvm/DebugInfo/DWARF/DWARFDebugArangeSet.h"
20 #include "llvm/DebugInfo/DWARF/DWARFDebugAranges.h"
21 #include "llvm/DebugInfo/DWARF/DWARFDebugFrame.h"
22 #include "llvm/DebugInfo/DWARF/DWARFDebugLine.h"
23 #include "llvm/DebugInfo/DWARF/DWARFDebugLoc.h"
24 #include "llvm/DebugInfo/DWARF/DWARFDebugMacro.h"
25 #include "llvm/DebugInfo/DWARF/DWARFDebugPubTable.h"
26 #include "llvm/DebugInfo/DWARF/DWARFDebugRangeList.h"
27 #include "llvm/DebugInfo/DWARF/DWARFDie.h"
28 #include "llvm/DebugInfo/DWARF/DWARFFormValue.h"
29 #include "llvm/DebugInfo/DWARF/DWARFGdbIndex.h"
30 #include "llvm/DebugInfo/DWARF/DWARFSection.h"
31 #include "llvm/DebugInfo/DWARF/DWARFUnitIndex.h"
32 #include "llvm/DebugInfo/DWARF/DWARFVerifier.h"
33 #include "llvm/Object/Decompressor.h"
34 #include "llvm/Object/MachO.h"
35 #include "llvm/Object/ObjectFile.h"
36 #include "llvm/Object/RelocVisitor.h"
37 #include "llvm/Support/Casting.h"
38 #include "llvm/Support/DataExtractor.h"
39 #include "llvm/Support/Debug.h"
40 #include "llvm/Support/Error.h"
41 #include "llvm/Support/Format.h"
42 #include "llvm/Support/MemoryBuffer.h"
43 #include "llvm/Support/raw_ostream.h"
53 using namespace dwarf;
54 using namespace object;
56 #define DEBUG_TYPE "dwarf"
58 typedef DWARFDebugLine::LineTable DWARFLineTable;
59 typedef DILineInfoSpecifier::FileLineInfoKind FileLineInfoKind;
60 typedef DILineInfoSpecifier::FunctionNameKind FunctionNameKind;
62 uint64_t llvm::getRelocatedValue(const DataExtractor &Data, uint32_t Size,
63 uint32_t *Off, const RelocAddrMap *Relocs,
64 uint64_t *SectionIndex) {
66 return Data.getUnsigned(Off, Size);
67 RelocAddrMap::const_iterator AI = Relocs->find(*Off);
68 if (AI == Relocs->end())
69 return Data.getUnsigned(Off, Size);
71 *SectionIndex = AI->second.SectionIndex;
72 return Data.getUnsigned(Off, Size) + AI->second.Value;
75 static void dumpAccelSection(raw_ostream &OS, StringRef Name,
76 const DWARFSection& Section, StringRef StringSection,
78 DataExtractor AccelSection(Section.Data, LittleEndian, 0);
79 DataExtractor StrData(StringSection, LittleEndian, 0);
80 OS << "\n." << Name << " contents:\n";
81 DWARFAcceleratorTable Accel(AccelSection, StrData, Section.Relocs);
88 dumpDWARFv5StringOffsetsSection(raw_ostream &OS, StringRef SectionName,
89 const DWARFSection &StringOffsetsSection,
90 StringRef StringSection, bool LittleEndian) {
91 DataExtractor StrOffsetExt(StringOffsetsSection.Data, LittleEndian, 0);
93 uint64_t SectionSize = StringOffsetsSection.Data.size();
95 while (Offset < SectionSize) {
97 DwarfFormat Format = DWARF32;
98 unsigned EntrySize = 4;
99 // Perform validation and extract the segment size from the header.
100 if (!StrOffsetExt.isValidOffsetForDataOfSize(Offset, 4)) {
101 OS << "error: invalid contribution to string offsets table in section ."
102 << SectionName << ".\n";
105 uint32_t ContributionStart = Offset;
106 uint64_t ContributionSize = StrOffsetExt.getU32(&Offset);
107 // A contribution size of 0xffffffff indicates DWARF64, with the actual size
108 // in the following 8 bytes. Otherwise, the DWARF standard mandates that
109 // the contribution size must be at most 0xfffffff0.
110 if (ContributionSize == 0xffffffff) {
111 if (!StrOffsetExt.isValidOffsetForDataOfSize(Offset, 8)) {
112 OS << "error: invalid contribution to string offsets table in section ."
113 << SectionName << ".\n";
118 ContributionSize = StrOffsetExt.getU64(&Offset);
119 } else if (ContributionSize > 0xfffffff0) {
120 OS << "error: invalid contribution to string offsets table in section ."
121 << SectionName << ".\n";
125 // We must ensure that we don't read a partial record at the end, so we
126 // validate for a multiple of EntrySize. Also, we're expecting a version
127 // number and padding, which adds an additional 4 bytes.
128 uint64_t ValidationSize =
129 4 + ((ContributionSize + EntrySize - 1) & (-(uint64_t)EntrySize));
130 if (!StrOffsetExt.isValidOffsetForDataOfSize(Offset, ValidationSize)) {
131 OS << "error: contribution to string offsets table in section ."
132 << SectionName << " has invalid length.\n";
136 Version = StrOffsetExt.getU16(&Offset);
138 OS << format("0x%8.8x: ", ContributionStart);
139 OS << "Contribution size = " << ContributionSize
140 << ", Version = " << Version << "\n";
142 uint32_t ContributionBase = Offset;
143 DataExtractor StrData(StringSection, LittleEndian, 0);
144 while (Offset - ContributionBase < ContributionSize) {
145 OS << format("0x%8.8x: ", Offset);
146 // FIXME: We can only extract strings in DWARF32 format at the moment.
147 uint64_t StringOffset = getRelocatedValue(
148 StrOffsetExt, EntrySize, &Offset, &StringOffsetsSection.Relocs);
149 if (Format == DWARF32) {
150 OS << format("%8.8x ", StringOffset);
151 uint32_t StringOffset32 = (uint32_t)StringOffset;
152 const char *S = StrData.getCStr(&StringOffset32);
154 OS << format("\"%s\"", S);
156 OS << format("%16.16x ", StringOffset);
162 // Dump a DWARF string offsets section. This may be a DWARF v5 formatted
163 // string offsets section, where each compile or type unit contributes a
164 // number of entries (string offsets), with each contribution preceded by
165 // a header containing size and version number. Alternatively, it may be a
166 // monolithic series of string offsets, as generated by the pre-DWARF v5
167 // implementation of split DWARF.
168 static void dumpStringOffsetsSection(raw_ostream &OS, StringRef SectionName,
169 const DWARFSection &StringOffsetsSection,
170 StringRef StringSection, bool LittleEndian,
171 unsigned MaxVersion) {
172 if (StringOffsetsSection.Data.empty())
174 OS << "\n." << SectionName << " contents:\n";
175 // If we have at least one (compile or type) unit with DWARF v5 or greater,
176 // we assume that the section is formatted like a DWARF v5 string offsets
179 dumpDWARFv5StringOffsetsSection(OS, SectionName, StringOffsetsSection,
180 StringSection, LittleEndian);
182 DataExtractor strOffsetExt(StringOffsetsSection.Data, LittleEndian, 0);
184 uint64_t size = StringOffsetsSection.Data.size();
185 // Ensure that size is a multiple of the size of an entry.
186 if (size & ((uint64_t)(sizeof(uint32_t) - 1))) {
187 OS << "error: size of ." << SectionName << " is not a multiple of "
188 << sizeof(uint32_t) << ".\n";
189 size &= -(uint64_t)sizeof(uint32_t);
191 DataExtractor StrData(StringSection, LittleEndian, 0);
192 while (offset < size) {
193 OS << format("0x%8.8x: ", offset);
194 uint32_t StringOffset = strOffsetExt.getU32(&offset);
195 OS << format("%8.8x ", StringOffset);
196 const char *S = StrData.getCStr(&StringOffset);
198 OS << format("\"%s\"", S);
204 void DWARFContext::dump(raw_ostream &OS, DIDumpOptions DumpOpts){
206 DIDumpType DumpType = DumpOpts.DumpType;
207 bool DumpEH = DumpOpts.DumpEH;
208 bool SummarizeTypes = DumpOpts.SummarizeTypes;
210 if (DumpType == DIDT_All || DumpType == DIDT_Abbrev) {
211 OS << ".debug_abbrev contents:\n";
212 getDebugAbbrev()->dump(OS);
215 if (DumpType == DIDT_All || DumpType == DIDT_AbbrevDwo)
216 if (const DWARFDebugAbbrev *D = getDebugAbbrevDWO()) {
217 OS << "\n.debug_abbrev.dwo contents:\n";
221 if (DumpType == DIDT_All || DumpType == DIDT_Info) {
222 OS << "\n.debug_info contents:\n";
223 for (const auto &CU : compile_units())
224 CU->dump(OS, DumpOpts);
227 if ((DumpType == DIDT_All || DumpType == DIDT_InfoDwo) &&
228 getNumDWOCompileUnits()) {
229 OS << "\n.debug_info.dwo contents:\n";
230 for (const auto &DWOCU : dwo_compile_units())
231 DWOCU->dump(OS, DumpOpts);
234 if ((DumpType == DIDT_All || DumpType == DIDT_Types) && getNumTypeUnits()) {
235 OS << "\n.debug_types contents:\n";
236 for (const auto &TUS : type_unit_sections())
237 for (const auto &TU : TUS)
238 TU->dump(OS, SummarizeTypes);
241 if ((DumpType == DIDT_All || DumpType == DIDT_TypesDwo) &&
242 getNumDWOTypeUnits()) {
243 OS << "\n.debug_types.dwo contents:\n";
244 for (const auto &DWOTUS : dwo_type_unit_sections())
245 for (const auto &DWOTU : DWOTUS)
246 DWOTU->dump(OS, SummarizeTypes);
249 if (DumpType == DIDT_All || DumpType == DIDT_Loc) {
250 OS << "\n.debug_loc contents:\n";
251 getDebugLoc()->dump(OS);
254 if (DumpType == DIDT_All || DumpType == DIDT_LocDwo) {
255 OS << "\n.debug_loc.dwo contents:\n";
256 getDebugLocDWO()->dump(OS);
259 if (DumpType == DIDT_All || DumpType == DIDT_Frames) {
260 OS << "\n.debug_frame contents:\n";
261 getDebugFrame()->dump(OS);
263 OS << "\n.eh_frame contents:\n";
264 getEHFrame()->dump(OS);
268 if (DumpType == DIDT_All || DumpType == DIDT_Macro) {
269 OS << "\n.debug_macinfo contents:\n";
270 getDebugMacro()->dump(OS);
274 if (DumpType == DIDT_All || DumpType == DIDT_Aranges) {
275 OS << "\n.debug_aranges contents:\n";
276 DataExtractor arangesData(getARangeSection(), isLittleEndian(), 0);
277 DWARFDebugArangeSet set;
278 while (set.extract(arangesData, &offset))
282 uint8_t savedAddressByteSize = 0;
283 if (DumpType == DIDT_All || DumpType == DIDT_Line) {
284 OS << "\n.debug_line contents:\n";
285 for (const auto &CU : compile_units()) {
286 savedAddressByteSize = CU->getAddressByteSize();
287 auto CUDIE = CU->getUnitDIE();
290 if (auto StmtOffset = toSectionOffset(CUDIE.find(DW_AT_stmt_list))) {
291 DataExtractor lineData(getLineSection().Data, isLittleEndian(),
292 savedAddressByteSize);
293 DWARFDebugLine::LineTable LineTable;
294 uint32_t Offset = *StmtOffset;
295 LineTable.parse(lineData, &getLineSection().Relocs, &Offset);
301 if (DumpType == DIDT_All || DumpType == DIDT_CUIndex) {
302 OS << "\n.debug_cu_index contents:\n";
303 getCUIndex().dump(OS);
306 if (DumpType == DIDT_All || DumpType == DIDT_TUIndex) {
307 OS << "\n.debug_tu_index contents:\n";
308 getTUIndex().dump(OS);
311 if (DumpType == DIDT_All || DumpType == DIDT_LineDwo) {
312 OS << "\n.debug_line.dwo contents:\n";
313 unsigned stmtOffset = 0;
314 DataExtractor lineData(getLineDWOSection().Data, isLittleEndian(),
315 savedAddressByteSize);
316 DWARFDebugLine::LineTable LineTable;
317 while (LineTable.Prologue.parse(lineData, &stmtOffset)) {
323 if (DumpType == DIDT_All || DumpType == DIDT_Str) {
324 OS << "\n.debug_str contents:\n";
325 DataExtractor strData(getStringSection(), isLittleEndian(), 0);
327 uint32_t strOffset = 0;
328 while (const char *s = strData.getCStr(&offset)) {
329 OS << format("0x%8.8x: \"%s\"\n", strOffset, s);
334 if ((DumpType == DIDT_All || DumpType == DIDT_StrDwo) &&
335 !getStringDWOSection().empty()) {
336 OS << "\n.debug_str.dwo contents:\n";
337 DataExtractor strDWOData(getStringDWOSection(), isLittleEndian(), 0);
339 uint32_t strDWOOffset = 0;
340 while (const char *s = strDWOData.getCStr(&offset)) {
341 OS << format("0x%8.8x: \"%s\"\n", strDWOOffset, s);
342 strDWOOffset = offset;
346 if (DumpType == DIDT_All || DumpType == DIDT_Ranges) {
347 OS << "\n.debug_ranges contents:\n";
348 // In fact, different compile units may have different address byte
349 // sizes, but for simplicity we just use the address byte size of the last
350 // compile unit (there is no easy and fast way to associate address range
351 // list and the compile unit it describes).
352 DataExtractor rangesData(getRangeSection().Data, isLittleEndian(),
353 savedAddressByteSize);
355 DWARFDebugRangeList rangeList;
356 while (rangeList.extract(rangesData, &offset, getRangeSection().Relocs))
360 if (DumpType == DIDT_All || DumpType == DIDT_Pubnames)
361 DWARFDebugPubTable(getPubNamesSection(), isLittleEndian(), false)
362 .dump("debug_pubnames", OS);
364 if (DumpType == DIDT_All || DumpType == DIDT_Pubtypes)
365 DWARFDebugPubTable(getPubTypesSection(), isLittleEndian(), false)
366 .dump("debug_pubtypes", OS);
368 if (DumpType == DIDT_All || DumpType == DIDT_GnuPubnames)
369 DWARFDebugPubTable(getGnuPubNamesSection(), isLittleEndian(),
371 .dump("debug_gnu_pubnames", OS);
373 if (DumpType == DIDT_All || DumpType == DIDT_GnuPubtypes)
374 DWARFDebugPubTable(getGnuPubTypesSection(), isLittleEndian(),
376 .dump("debug_gnu_pubtypes", OS);
378 if (DumpType == DIDT_All || DumpType == DIDT_StrOffsets)
379 dumpStringOffsetsSection(OS, "debug_str_offsets", getStringOffsetSection(),
380 getStringSection(), isLittleEndian(),
383 if (DumpType == DIDT_All || DumpType == DIDT_StrOffsetsDwo) {
384 dumpStringOffsetsSection(OS, "debug_str_offsets.dwo",
385 getStringOffsetDWOSection(), getStringDWOSection(),
386 isLittleEndian(), getMaxVersion());
389 if ((DumpType == DIDT_All || DumpType == DIDT_GdbIndex) &&
390 !getGdbIndexSection().empty()) {
391 OS << "\n.gnu_index contents:\n";
392 getGdbIndex().dump(OS);
395 if (DumpType == DIDT_All || DumpType == DIDT_AppleNames)
396 dumpAccelSection(OS, "apple_names", getAppleNamesSection(),
397 getStringSection(), isLittleEndian());
399 if (DumpType == DIDT_All || DumpType == DIDT_AppleTypes)
400 dumpAccelSection(OS, "apple_types", getAppleTypesSection(),
401 getStringSection(), isLittleEndian());
403 if (DumpType == DIDT_All || DumpType == DIDT_AppleNamespaces)
404 dumpAccelSection(OS, "apple_namespaces", getAppleNamespacesSection(),
405 getStringSection(), isLittleEndian());
407 if (DumpType == DIDT_All || DumpType == DIDT_AppleObjC)
408 dumpAccelSection(OS, "apple_objc", getAppleObjCSection(),
409 getStringSection(), isLittleEndian());
412 DWARFCompileUnit *DWARFContext::getDWOCompileUnitForHash(uint64_t Hash) {
413 // FIXME: Improve this for the case where this DWO file is really a DWP file
414 // with an index - use the index for lookup instead of a linear search.
415 for (const auto &DWOCU : dwo_compile_units())
416 if (DWOCU->getDWOId() == Hash)
421 DWARFDie DWARFContext::getDIEForOffset(uint32_t Offset) {
423 if (auto *CU = CUs.getUnitForOffset(Offset))
424 return CU->getDIEForOffset(Offset);
434 Verifier(raw_ostream &S, DWARFContext &D) : OS(S), DCtx(D) {}
436 bool HandleDebugInfo() {
438 // A map that tracks all references (converted absolute references) so we
439 // can verify each reference points to a valid DIE and not an offset that
440 // lies between to valid DIEs.
441 std::map<uint64_t, std::set<uint32_t>> ReferenceToDIEOffsets;
443 OS << "Verifying .debug_info...\n";
444 for (const auto &CU : DCtx.compile_units()) {
445 unsigned NumDies = CU->getNumDIEs();
446 for (unsigned I = 0; I < NumDies; ++I) {
447 auto Die = CU->getDIEAtIndex(I);
448 const auto Tag = Die.getTag();
449 if (Tag == DW_TAG_null)
451 for (auto AttrValue : Die.attributes()) {
452 const auto Attr = AttrValue.Attr;
453 const auto Form = AttrValue.Value.getForm();
456 // Make sure the offset in the DW_AT_ranges attribute is valid.
457 if (auto SectionOffset = AttrValue.Value.getAsSectionOffset()) {
458 if (*SectionOffset >= DCtx.getRangeSection().Data.size()) {
460 OS << "error: DW_AT_ranges offset is beyond .debug_ranges "
467 OS << "error: DIE has invalid DW_AT_ranges encoding:\n";
472 case DW_AT_stmt_list:
473 // Make sure the offset in the DW_AT_stmt_list attribute is valid.
474 if (auto SectionOffset = AttrValue.Value.getAsSectionOffset()) {
475 if (*SectionOffset >= DCtx.getLineSection().Data.size()) {
477 OS << "error: DW_AT_stmt_list offset is beyond .debug_line "
479 << format("0x%08" PRIx32, *SectionOffset) << "\n";
480 CU->getUnitDIE().dump(OS, 0);
485 OS << "error: DIE has invalid DW_AT_stmt_list encoding:\n";
499 case DW_FORM_ref_udata: {
500 // Verify all CU relative references are valid CU offsets.
501 Optional<uint64_t> RefVal = AttrValue.Value.getAsReference();
504 auto DieCU = Die.getDwarfUnit();
505 auto CUSize = DieCU->getNextUnitOffset() - DieCU->getOffset();
506 auto CUOffset = AttrValue.Value.getRawUValue();
507 if (CUOffset >= CUSize) {
509 OS << "error: " << FormEncodingString(Form) << " CU offset "
510 << format("0x%08" PRIx32, CUOffset)
511 << " is invalid (must be less than CU size of "
512 << format("0x%08" PRIx32, CUSize) << "):\n";
516 // Valid reference, but we will verify it points to an actual
518 ReferenceToDIEOffsets[*RefVal].insert(Die.getOffset());
523 case DW_FORM_ref_addr: {
524 // Verify all absolute DIE references have valid offsets in the
525 // .debug_info section.
526 Optional<uint64_t> RefVal = AttrValue.Value.getAsReference();
529 if(*RefVal >= DCtx.getInfoSection().Data.size()) {
531 OS << "error: DW_FORM_ref_addr offset beyond .debug_info "
536 // Valid reference, but we will verify it points to an actual
538 ReferenceToDIEOffsets[*RefVal].insert(Die.getOffset());
544 auto SecOffset = AttrValue.Value.getAsSectionOffset();
545 assert(SecOffset); // DW_FORM_strp is a section offset.
546 if (SecOffset && *SecOffset >= DCtx.getStringSection().size()) {
548 OS << "error: DW_FORM_strp offset beyond .debug_str bounds:\n";
561 // Take all references and make sure they point to an actual DIE by
562 // getting the DIE by offset and emitting an error
563 OS << "Verifying .debug_info references...\n";
564 for (auto Pair: ReferenceToDIEOffsets) {
565 auto Die = DCtx.getDIEForOffset(Pair.first);
569 OS << "error: invalid DIE reference " << format("0x%08" PRIx64, Pair.first)
570 << ". Offset is in between DIEs:\n";
571 for (auto Offset: Pair.second) {
572 auto ReferencingDie = DCtx.getDIEForOffset(Offset);
573 ReferencingDie.dump(OS, 0);
581 bool HandleDebugLine() {
582 std::map<uint64_t, DWARFDie> StmtListToDie;
584 OS << "Verifying .debug_line...\n";
585 for (const auto &CU : DCtx.compile_units()) {
586 uint32_t LineTableOffset = 0;
587 auto CUDie = CU->getUnitDIE();
588 auto StmtFormValue = CUDie.find(DW_AT_stmt_list);
589 if (!StmtFormValue) {
590 // No line table for this compile unit.
593 // Get the attribute value as a section offset. No need to produce an
594 // error here if the encoding isn't correct because we validate this in
595 // the .debug_info verifier.
596 if (auto StmtSectionOffset = toSectionOffset(StmtFormValue)) {
597 LineTableOffset = *StmtSectionOffset;
598 if (LineTableOffset >= DCtx.getLineSection().Data.size()) {
599 // Make sure we don't get a valid line table back if the offset
601 assert(DCtx.getLineTableForUnit(CU.get()) == nullptr);
602 // Skip this line table as it isn't valid. No need to create an error
603 // here because we validate this in the .debug_info verifier.
606 auto Iter = StmtListToDie.find(LineTableOffset);
607 if (Iter != StmtListToDie.end()) {
609 OS << "error: two compile unit DIEs, "
610 << format("0x%08" PRIx32, Iter->second.getOffset()) << " and "
611 << format("0x%08" PRIx32, CUDie.getOffset())
612 << ", have the same DW_AT_stmt_list section offset:\n";
613 Iter->second.dump(OS, 0);
616 // Already verified this line table before, no need to do it again.
619 StmtListToDie[LineTableOffset] = CUDie;
622 auto LineTable = DCtx.getLineTableForUnit(CU.get());
625 OS << "error: .debug_line[" << format("0x%08" PRIx32, LineTableOffset)
626 << "] was not able to be parsed for CU:\n";
631 uint32_t MaxFileIndex = LineTable->Prologue.FileNames.size();
632 uint64_t PrevAddress = 0;
633 uint32_t RowIndex = 0;
634 for (const auto &Row : LineTable->Rows) {
635 if (Row.Address < PrevAddress) {
637 OS << "error: .debug_line[" << format("0x%08" PRIx32, LineTableOffset)
638 << "] row[" << RowIndex
639 << "] decreases in address from previous row:\n";
641 DWARFDebugLine::Row::dumpTableHeader(OS);
643 LineTable->Rows[RowIndex - 1].dump(OS);
648 if (Row.File > MaxFileIndex) {
650 OS << "error: .debug_line[" << format("0x%08" PRIx32, LineTableOffset)
651 << "][" << RowIndex << "] has invalid file index " << Row.File
652 << " (valid values are [1," << MaxFileIndex << "]):\n";
653 DWARFDebugLine::Row::dumpTableHeader(OS);
660 PrevAddress = Row.Address;
668 } // anonymous namespace
670 bool DWARFContext::verify(raw_ostream &OS, DIDumpType DumpType) {
672 DWARFVerifier verifier(OS, *this);
673 if (DumpType == DIDT_All || DumpType == DIDT_Info) {
674 if (!verifier.handleDebugInfo())
677 if (DumpType == DIDT_All || DumpType == DIDT_Line) {
678 if (!verifier.handleDebugLine())
683 const DWARFUnitIndex &DWARFContext::getCUIndex() {
687 DataExtractor CUIndexData(getCUIndexSection(), isLittleEndian(), 0);
689 CUIndex = llvm::make_unique<DWARFUnitIndex>(DW_SECT_INFO);
690 CUIndex->parse(CUIndexData);
694 const DWARFUnitIndex &DWARFContext::getTUIndex() {
698 DataExtractor TUIndexData(getTUIndexSection(), isLittleEndian(), 0);
700 TUIndex = llvm::make_unique<DWARFUnitIndex>(DW_SECT_TYPES);
701 TUIndex->parse(TUIndexData);
705 DWARFGdbIndex &DWARFContext::getGdbIndex() {
709 DataExtractor GdbIndexData(getGdbIndexSection(), true /*LE*/, 0);
710 GdbIndex = llvm::make_unique<DWARFGdbIndex>();
711 GdbIndex->parse(GdbIndexData);
715 const DWARFDebugAbbrev *DWARFContext::getDebugAbbrev() {
719 DataExtractor abbrData(getAbbrevSection(), isLittleEndian(), 0);
721 Abbrev.reset(new DWARFDebugAbbrev());
722 Abbrev->extract(abbrData);
726 const DWARFDebugAbbrev *DWARFContext::getDebugAbbrevDWO() {
728 return AbbrevDWO.get();
730 DataExtractor abbrData(getAbbrevDWOSection(), isLittleEndian(), 0);
731 AbbrevDWO.reset(new DWARFDebugAbbrev());
732 AbbrevDWO->extract(abbrData);
733 return AbbrevDWO.get();
736 const DWARFDebugLoc *DWARFContext::getDebugLoc() {
740 DataExtractor LocData(getLocSection().Data, isLittleEndian(), 0);
741 Loc.reset(new DWARFDebugLoc(getLocSection().Relocs));
742 // assume all compile units have the same address byte size
743 if (getNumCompileUnits())
744 Loc->parse(LocData, getCompileUnitAtIndex(0)->getAddressByteSize());
748 const DWARFDebugLocDWO *DWARFContext::getDebugLocDWO() {
752 DataExtractor LocData(getLocDWOSection().Data, isLittleEndian(), 0);
753 LocDWO.reset(new DWARFDebugLocDWO());
754 LocDWO->parse(LocData);
758 const DWARFDebugAranges *DWARFContext::getDebugAranges() {
760 return Aranges.get();
762 Aranges.reset(new DWARFDebugAranges());
763 Aranges->generate(this);
764 return Aranges.get();
767 const DWARFDebugFrame *DWARFContext::getDebugFrame() {
769 return DebugFrame.get();
771 // There's a "bug" in the DWARFv3 standard with respect to the target address
772 // size within debug frame sections. While DWARF is supposed to be independent
773 // of its container, FDEs have fields with size being "target address size",
774 // which isn't specified in DWARF in general. It's only specified for CUs, but
775 // .eh_frame can appear without a .debug_info section. Follow the example of
776 // other tools (libdwarf) and extract this from the container (ObjectFile
777 // provides this information). This problem is fixed in DWARFv4
778 // See this dwarf-discuss discussion for more details:
779 // http://lists.dwarfstd.org/htdig.cgi/dwarf-discuss-dwarfstd.org/2011-December/001173.html
780 DataExtractor debugFrameData(getDebugFrameSection(), isLittleEndian(),
782 DebugFrame.reset(new DWARFDebugFrame(false /* IsEH */));
783 DebugFrame->parse(debugFrameData);
784 return DebugFrame.get();
787 const DWARFDebugFrame *DWARFContext::getEHFrame() {
789 return EHFrame.get();
791 DataExtractor debugFrameData(getEHFrameSection(), isLittleEndian(),
793 DebugFrame.reset(new DWARFDebugFrame(true /* IsEH */));
794 DebugFrame->parse(debugFrameData);
795 return DebugFrame.get();
798 const DWARFDebugMacro *DWARFContext::getDebugMacro() {
802 DataExtractor MacinfoData(getMacinfoSection(), isLittleEndian(), 0);
803 Macro.reset(new DWARFDebugMacro());
804 Macro->parse(MacinfoData);
808 const DWARFLineTable *
809 DWARFContext::getLineTableForUnit(DWARFUnit *U) {
811 Line.reset(new DWARFDebugLine(&getLineSection().Relocs));
813 auto UnitDIE = U->getUnitDIE();
817 auto Offset = toSectionOffset(UnitDIE.find(DW_AT_stmt_list));
819 return nullptr; // No line table for this compile unit.
821 uint32_t stmtOffset = *Offset + U->getLineTableOffset();
822 // See if the line table is cached.
823 if (const DWARFLineTable *lt = Line->getLineTable(stmtOffset))
826 // Make sure the offset is good before we try to parse.
827 if (stmtOffset >= U->getLineSection().size())
830 // We have to parse it first.
831 DataExtractor lineData(U->getLineSection(), isLittleEndian(),
832 U->getAddressByteSize());
833 return Line->getOrParseLineTable(lineData, stmtOffset);
836 void DWARFContext::parseCompileUnits() {
837 CUs.parse(*this, getInfoSection());
840 void DWARFContext::parseTypeUnits() {
843 for (const auto &I : getTypesSections()) {
845 TUs.back().parse(*this, I.second);
849 void DWARFContext::parseDWOCompileUnits() {
850 DWOCUs.parseDWO(*this, getInfoDWOSection());
853 void DWARFContext::parseDWOTypeUnits() {
856 for (const auto &I : getTypesDWOSections()) {
857 DWOTUs.emplace_back();
858 DWOTUs.back().parseDWO(*this, I.second);
862 DWARFCompileUnit *DWARFContext::getCompileUnitForOffset(uint32_t Offset) {
864 return CUs.getUnitForOffset(Offset);
867 DWARFCompileUnit *DWARFContext::getCompileUnitForAddress(uint64_t Address) {
868 // First, get the offset of the compile unit.
869 uint32_t CUOffset = getDebugAranges()->findAddress(Address);
870 // Retrieve the compile unit.
871 return getCompileUnitForOffset(CUOffset);
874 static bool getFunctionNameAndStartLineForAddress(DWARFCompileUnit *CU,
876 FunctionNameKind Kind,
877 std::string &FunctionName,
878 uint32_t &StartLine) {
879 // The address may correspond to instruction in some inlined function,
880 // so we have to build the chain of inlined functions and take the
881 // name of the topmost function in it.
882 SmallVector<DWARFDie, 4> InlinedChain;
883 CU->getInlinedChainForAddress(Address, InlinedChain);
884 if (InlinedChain.empty())
887 const DWARFDie &DIE = InlinedChain[0];
888 bool FoundResult = false;
889 const char *Name = nullptr;
890 if (Kind != FunctionNameKind::None && (Name = DIE.getSubroutineName(Kind))) {
894 if (auto DeclLineResult = DIE.getDeclLine()) {
895 StartLine = DeclLineResult;
902 DILineInfo DWARFContext::getLineInfoForAddress(uint64_t Address,
903 DILineInfoSpecifier Spec) {
906 DWARFCompileUnit *CU = getCompileUnitForAddress(Address);
909 getFunctionNameAndStartLineForAddress(CU, Address, Spec.FNKind,
912 if (Spec.FLIKind != FileLineInfoKind::None) {
913 if (const DWARFLineTable *LineTable = getLineTableForUnit(CU))
914 LineTable->getFileLineInfoForAddress(Address, CU->getCompilationDir(),
915 Spec.FLIKind, Result);
921 DWARFContext::getLineInfoForAddressRange(uint64_t Address, uint64_t Size,
922 DILineInfoSpecifier Spec) {
923 DILineInfoTable Lines;
924 DWARFCompileUnit *CU = getCompileUnitForAddress(Address);
928 std::string FunctionName = "<invalid>";
929 uint32_t StartLine = 0;
930 getFunctionNameAndStartLineForAddress(CU, Address, Spec.FNKind, FunctionName,
933 // If the Specifier says we don't need FileLineInfo, just
934 // return the top-most function at the starting address.
935 if (Spec.FLIKind == FileLineInfoKind::None) {
937 Result.FunctionName = FunctionName;
938 Result.StartLine = StartLine;
939 Lines.push_back(std::make_pair(Address, Result));
943 const DWARFLineTable *LineTable = getLineTableForUnit(CU);
945 // Get the index of row we're looking for in the line table.
946 std::vector<uint32_t> RowVector;
947 if (!LineTable->lookupAddressRange(Address, Size, RowVector))
950 for (uint32_t RowIndex : RowVector) {
951 // Take file number and line/column from the row.
952 const DWARFDebugLine::Row &Row = LineTable->Rows[RowIndex];
954 LineTable->getFileNameByIndex(Row.File, CU->getCompilationDir(),
955 Spec.FLIKind, Result.FileName);
956 Result.FunctionName = FunctionName;
957 Result.Line = Row.Line;
958 Result.Column = Row.Column;
959 Result.StartLine = StartLine;
960 Lines.push_back(std::make_pair(Row.Address, Result));
967 DWARFContext::getInliningInfoForAddress(uint64_t Address,
968 DILineInfoSpecifier Spec) {
969 DIInliningInfo InliningInfo;
971 DWARFCompileUnit *CU = getCompileUnitForAddress(Address);
975 const DWARFLineTable *LineTable = nullptr;
976 SmallVector<DWARFDie, 4> InlinedChain;
977 CU->getInlinedChainForAddress(Address, InlinedChain);
978 if (InlinedChain.size() == 0) {
979 // If there is no DIE for address (e.g. it is in unavailable .dwo file),
980 // try to at least get file/line info from symbol table.
981 if (Spec.FLIKind != FileLineInfoKind::None) {
983 LineTable = getLineTableForUnit(CU);
985 LineTable->getFileLineInfoForAddress(Address, CU->getCompilationDir(),
986 Spec.FLIKind, Frame))
987 InliningInfo.addFrame(Frame);
992 uint32_t CallFile = 0, CallLine = 0, CallColumn = 0, CallDiscriminator = 0;
993 for (uint32_t i = 0, n = InlinedChain.size(); i != n; i++) {
994 DWARFDie &FunctionDIE = InlinedChain[i];
996 // Get function name if necessary.
997 if (const char *Name = FunctionDIE.getSubroutineName(Spec.FNKind))
998 Frame.FunctionName = Name;
999 if (auto DeclLineResult = FunctionDIE.getDeclLine())
1000 Frame.StartLine = DeclLineResult;
1001 if (Spec.FLIKind != FileLineInfoKind::None) {
1003 // For the topmost frame, initialize the line table of this
1004 // compile unit and fetch file/line info from it.
1005 LineTable = getLineTableForUnit(CU);
1006 // For the topmost routine, get file/line info from line table.
1008 LineTable->getFileLineInfoForAddress(Address, CU->getCompilationDir(),
1009 Spec.FLIKind, Frame);
1011 // Otherwise, use call file, call line and call column from
1012 // previous DIE in inlined chain.
1014 LineTable->getFileNameByIndex(CallFile, CU->getCompilationDir(),
1015 Spec.FLIKind, Frame.FileName);
1016 Frame.Line = CallLine;
1017 Frame.Column = CallColumn;
1018 Frame.Discriminator = CallDiscriminator;
1020 // Get call file/line/column of a current DIE.
1022 FunctionDIE.getCallerFrame(CallFile, CallLine, CallColumn,
1026 InliningInfo.addFrame(Frame);
1028 return InliningInfo;
1031 std::shared_ptr<DWARFContext>
1032 DWARFContext::getDWOContext(StringRef AbsolutePath) {
1033 if (auto S = DWP.lock()) {
1034 DWARFContext *Ctxt = S->Context.get();
1035 return std::shared_ptr<DWARFContext>(std::move(S), Ctxt);
1038 std::weak_ptr<DWOFile> *Entry = &DWOFiles[AbsolutePath];
1040 if (auto S = Entry->lock()) {
1041 DWARFContext *Ctxt = S->Context.get();
1042 return std::shared_ptr<DWARFContext>(std::move(S), Ctxt);
1045 SmallString<128> DWPName;
1046 Expected<OwningBinary<ObjectFile>> Obj = [&] {
1047 if (!CheckedForDWP) {
1048 (getFileName() + ".dwp").toVector(DWPName);
1049 auto Obj = object::ObjectFile::createObjectFile(DWPName);
1054 CheckedForDWP = true;
1055 // TODO: Should this error be handled (maybe in a high verbosity mode)
1056 // before falling back to .dwo files?
1057 consumeError(Obj.takeError());
1061 return object::ObjectFile::createObjectFile(AbsolutePath);
1065 // TODO: Actually report errors helpfully.
1066 consumeError(Obj.takeError());
1070 auto S = std::make_shared<DWOFile>();
1071 S->File = std::move(Obj.get());
1072 S->Context = llvm::make_unique<DWARFContextInMemory>(*S->File.getBinary());
1074 auto *Ctxt = S->Context.get();
1075 return std::shared_ptr<DWARFContext>(std::move(S), Ctxt);
1078 static Error createError(const Twine &Reason, llvm::Error E) {
1079 return make_error<StringError>(Reason + toString(std::move(E)),
1080 inconvertibleErrorCode());
1083 /// SymInfo contains information about symbol: it's address
1084 /// and section index which is -1LL for absolute symbols.
1087 uint64_t SectionIndex;
1090 /// Returns the address of symbol relocation used against and a section index.
1091 /// Used for futher relocations computation. Symbol's section load address is
1092 static Expected<SymInfo> getSymbolInfo(const object::ObjectFile &Obj,
1093 const RelocationRef &Reloc,
1094 const LoadedObjectInfo *L,
1095 std::map<SymbolRef, SymInfo> &Cache) {
1096 SymInfo Ret = {0, (uint64_t)-1LL};
1097 object::section_iterator RSec = Obj.section_end();
1098 object::symbol_iterator Sym = Reloc.getSymbol();
1100 std::map<SymbolRef, SymInfo>::iterator CacheIt = Cache.end();
1101 // First calculate the address of the symbol or section as it appears
1102 // in the object file
1103 if (Sym != Obj.symbol_end()) {
1105 std::tie(CacheIt, New) = Cache.insert({*Sym, {0, 0}});
1107 return CacheIt->second;
1109 Expected<uint64_t> SymAddrOrErr = Sym->getAddress();
1111 return createError("error: failed to compute symbol address: ",
1112 SymAddrOrErr.takeError());
1114 // Also remember what section this symbol is in for later
1115 auto SectOrErr = Sym->getSection();
1117 return createError("error: failed to get symbol section: ",
1118 SectOrErr.takeError());
1121 Ret.Address = *SymAddrOrErr;
1122 } else if (auto *MObj = dyn_cast<MachOObjectFile>(&Obj)) {
1123 RSec = MObj->getRelocationSection(Reloc.getRawDataRefImpl());
1124 Ret.Address = RSec->getAddress();
1127 if (RSec != Obj.section_end())
1128 Ret.SectionIndex = RSec->getIndex();
1130 // If we are given load addresses for the sections, we need to adjust:
1131 // SymAddr = (Address of Symbol Or Section in File) -
1132 // (Address of Section in File) +
1133 // (Load Address of Section)
1134 // RSec is now either the section being targeted or the section
1135 // containing the symbol being targeted. In either case,
1136 // we need to perform the same computation.
1137 if (L && RSec != Obj.section_end())
1138 if (uint64_t SectionLoadAddress = L->getSectionLoadAddress(*RSec))
1139 Ret.Address += SectionLoadAddress - RSec->getAddress();
1141 if (CacheIt != Cache.end())
1142 CacheIt->second = Ret;
1147 static bool isRelocScattered(const object::ObjectFile &Obj,
1148 const RelocationRef &Reloc) {
1149 const MachOObjectFile *MachObj = dyn_cast<MachOObjectFile>(&Obj);
1152 // MachO also has relocations that point to sections and
1153 // scattered relocations.
1154 auto RelocInfo = MachObj->getRelocation(Reloc.getRawDataRefImpl());
1155 return MachObj->isRelocationScattered(RelocInfo);
1158 Error DWARFContextInMemory::maybeDecompress(const SectionRef &Sec,
1159 StringRef Name, StringRef &Data) {
1160 if (!Decompressor::isCompressed(Sec))
1161 return Error::success();
1163 Expected<Decompressor> Decompressor =
1164 Decompressor::create(Name, Data, IsLittleEndian, AddressSize == 8);
1166 return Decompressor.takeError();
1168 SmallString<32> Out;
1169 if (auto Err = Decompressor->resizeAndDecompress(Out))
1172 UncompressedSections.emplace_back(std::move(Out));
1173 Data = UncompressedSections.back();
1175 return Error::success();
1178 DWARFContextInMemory::DWARFContextInMemory(const object::ObjectFile &Obj,
1179 const LoadedObjectInfo *L)
1180 : FileName(Obj.getFileName()), IsLittleEndian(Obj.isLittleEndian()),
1181 AddressSize(Obj.getBytesInAddress()) {
1182 for (const SectionRef &Section : Obj.sections()) {
1184 Section.getName(name);
1185 // Skip BSS and Virtual sections, they aren't interesting.
1186 bool IsBSS = Section.isBSS();
1189 bool IsVirtual = Section.isVirtual();
1194 section_iterator RelocatedSection = Section.getRelocatedSection();
1195 // Try to obtain an already relocated version of this section.
1196 // Else use the unrelocated section from the object file. We'll have to
1197 // apply relocations ourselves later.
1198 if (!L || !L->getLoadedSectionContents(*RelocatedSection, data))
1199 Section.getContents(data);
1201 if (auto Err = maybeDecompress(Section, name, data)) {
1202 errs() << "error: failed to decompress '" + name + "', " +
1203 toString(std::move(Err))
1208 // Compressed sections names in GNU style starts from ".z",
1209 // at this point section is decompressed and we drop compression prefix.
1211 name.find_first_not_of("._z")); // Skip ".", "z" and "_" prefixes.
1213 if (StringRef *SectionData = MapSectionToMember(name)) {
1214 *SectionData = data;
1215 if (name == "debug_ranges") {
1216 // FIXME: Use the other dwo range section when we emit it.
1217 RangeDWOSection.Data = data;
1219 } else if (name == "debug_types") {
1220 // Find debug_types data by section rather than name as there are
1221 // multiple, comdat grouped, debug_types sections.
1222 TypesSections[Section].Data = data;
1223 } else if (name == "debug_types.dwo") {
1224 TypesDWOSections[Section].Data = data;
1227 // Map platform specific debug section names to DWARF standard section
1229 name = Obj.mapDebugSectionName(name);
1231 if (RelocatedSection == Obj.section_end())
1234 StringRef RelSecName;
1235 StringRef RelSecData;
1236 RelocatedSection->getName(RelSecName);
1238 // If the section we're relocating was relocated already by the JIT,
1239 // then we used the relocated version above, so we do not need to process
1240 // relocations for it now.
1241 if (L && L->getLoadedSectionContents(*RelocatedSection, RelSecData))
1244 // In Mach-o files, the relocations do not need to be applied if
1245 // there is no load offset to apply. The value read at the
1246 // relocation point already factors in the section address
1247 // (actually applying the relocations will produce wrong results
1248 // as the section address will be added twice).
1249 if (!L && isa<MachOObjectFile>(&Obj))
1252 RelSecName = RelSecName.substr(
1253 RelSecName.find_first_not_of("._")); // Skip . and _ prefixes.
1255 // TODO: Add support for relocations in other sections as needed.
1256 // Record relocations for the debug_info and debug_line sections.
1258 StringSwitch<RelocAddrMap *>(RelSecName)
1259 .Case("debug_info", &InfoSection.Relocs)
1260 .Case("debug_loc", &LocSection.Relocs)
1261 .Case("debug_info.dwo", &InfoDWOSection.Relocs)
1262 .Case("debug_line", &LineSection.Relocs)
1263 .Case("debug_str_offsets", &StringOffsetSection.Relocs)
1264 .Case("debug_ranges", &RangeSection.Relocs)
1265 .Case("debug_addr", &AddrSection.Relocs)
1266 .Case("apple_names", &AppleNamesSection.Relocs)
1267 .Case("apple_types", &AppleTypesSection.Relocs)
1268 .Case("apple_namespaces", &AppleNamespacesSection.Relocs)
1269 .Case("apple_namespac", &AppleNamespacesSection.Relocs)
1270 .Case("apple_objc", &AppleObjCSection.Relocs)
1273 // Find debug_types relocs by section rather than name as there are
1274 // multiple, comdat grouped, debug_types sections.
1275 if (RelSecName == "debug_types")
1276 Map = &TypesSections[*RelocatedSection].Relocs;
1277 else if (RelSecName == "debug_types.dwo")
1278 Map = &TypesDWOSections[*RelocatedSection].Relocs;
1283 if (Section.relocation_begin() == Section.relocation_end())
1286 // Symbol to [address, section index] cache mapping.
1287 std::map<SymbolRef, SymInfo> AddrCache;
1288 for (const RelocationRef &Reloc : Section.relocations()) {
1289 // FIXME: it's not clear how to correctly handle scattered
1291 if (isRelocScattered(Obj, Reloc))
1294 Expected<SymInfo> SymInfoOrErr = getSymbolInfo(Obj, Reloc, L, AddrCache);
1295 if (!SymInfoOrErr) {
1296 errs() << toString(SymInfoOrErr.takeError()) << '\n';
1300 object::RelocVisitor V(Obj);
1301 uint64_t Val = V.visit(Reloc.getType(), Reloc, SymInfoOrErr->Address);
1303 SmallString<32> Name;
1304 Reloc.getTypeName(Name);
1305 errs() << "error: failed to compute relocation: " << Name << "\n";
1308 llvm::RelocAddrEntry Rel = {SymInfoOrErr->SectionIndex, Val};
1309 Map->insert({Reloc.getOffset(), Rel});
1314 DWARFContextInMemory::DWARFContextInMemory(
1315 const StringMap<std::unique_ptr<MemoryBuffer>> &Sections, uint8_t AddrSize,
1316 bool isLittleEndian)
1317 : IsLittleEndian(isLittleEndian), AddressSize(AddrSize) {
1318 for (const auto &SecIt : Sections) {
1319 if (StringRef *SectionData = MapSectionToMember(SecIt.first()))
1320 *SectionData = SecIt.second->getBuffer();
1324 StringRef *DWARFContextInMemory::MapSectionToMember(StringRef Name) {
1325 return StringSwitch<StringRef *>(Name)
1326 .Case("debug_info", &InfoSection.Data)
1327 .Case("debug_abbrev", &AbbrevSection)
1328 .Case("debug_loc", &LocSection.Data)
1329 .Case("debug_line", &LineSection.Data)
1330 .Case("debug_aranges", &ARangeSection)
1331 .Case("debug_frame", &DebugFrameSection)
1332 .Case("eh_frame", &EHFrameSection)
1333 .Case("debug_str", &StringSection)
1334 .Case("debug_str_offsets", &StringOffsetSection.Data)
1335 .Case("debug_ranges", &RangeSection.Data)
1336 .Case("debug_macinfo", &MacinfoSection)
1337 .Case("debug_pubnames", &PubNamesSection)
1338 .Case("debug_pubtypes", &PubTypesSection)
1339 .Case("debug_gnu_pubnames", &GnuPubNamesSection)
1340 .Case("debug_gnu_pubtypes", &GnuPubTypesSection)
1341 .Case("debug_info.dwo", &InfoDWOSection.Data)
1342 .Case("debug_abbrev.dwo", &AbbrevDWOSection)
1343 .Case("debug_loc.dwo", &LocDWOSection.Data)
1344 .Case("debug_line.dwo", &LineDWOSection.Data)
1345 .Case("debug_str.dwo", &StringDWOSection)
1346 .Case("debug_str_offsets.dwo", &StringOffsetDWOSection.Data)
1347 .Case("debug_addr", &AddrSection.Data)
1348 .Case("apple_names", &AppleNamesSection.Data)
1349 .Case("apple_types", &AppleTypesSection.Data)
1350 .Case("apple_namespaces", &AppleNamespacesSection.Data)
1351 .Case("apple_namespac", &AppleNamespacesSection.Data)
1352 .Case("apple_objc", &AppleObjCSection.Data)
1353 .Case("debug_cu_index", &CUIndexSection)
1354 .Case("debug_tu_index", &TUIndexSection)
1355 .Case("gdb_index", &GdbIndexSection)
1356 // Any more debug info sections go here.
1360 void DWARFContextInMemory::anchor() {}