1 //===-- DWARFUnit.cpp -----------------------------------------------------===//
2 //
3 // The LLVM Compiler Infrastructure
4 //
5 // This file is distributed under the University of Illinois Open Source
6 // License. See LICENSE.TXT for details.
7 //
8 //===----------------------------------------------------------------------===//
9
10 #include "llvm/DebugInfo/DWARF/DWARFUnit.h"
11 #include "llvm/DebugInfo/DWARF/DWARFContext.h"
12 #include "llvm/DebugInfo/DWARF/DWARFFormValue.h"
13 #include "llvm/Support/Dwarf.h"
14 #include "llvm/Support/Path.h"
15 #include <cstdio>
16
17 namespace llvm {
18 using namespace dwarf;
19
parse(DWARFContext & C,const DWARFSection & Section)20 void DWARFUnitSectionBase::parse(DWARFContext &C, const DWARFSection &Section) {
21 parseImpl(C, Section, C.getDebugAbbrev(), C.getRangeSection(),
22 C.getStringSection(), StringRef(), C.getAddrSection(),
23 C.getLineSection().Data, C.isLittleEndian(), false);
24 }
25
parseDWO(DWARFContext & C,const DWARFSection & DWOSection,DWARFUnitIndex * Index)26 void DWARFUnitSectionBase::parseDWO(DWARFContext &C,
27 const DWARFSection &DWOSection,
28 DWARFUnitIndex *Index) {
29 parseImpl(C, DWOSection, C.getDebugAbbrevDWO(), C.getRangeDWOSection(),
30 C.getStringDWOSection(), C.getStringOffsetDWOSection(),
31 C.getAddrSection(), C.getLineDWOSection().Data, C.isLittleEndian(),
32 true);
33 }
34
DWARFUnit(DWARFContext & DC,const DWARFSection & Section,const DWARFDebugAbbrev * DA,StringRef RS,StringRef SS,StringRef SOS,StringRef AOS,StringRef LS,bool LE,bool IsDWO,const DWARFUnitSectionBase & UnitSection,const DWARFUnitIndex::Entry * IndexEntry)35 DWARFUnit::DWARFUnit(DWARFContext &DC, const DWARFSection &Section,
36 const DWARFDebugAbbrev *DA, StringRef RS, StringRef SS,
37 StringRef SOS, StringRef AOS, StringRef LS, bool LE,
38 bool IsDWO, const DWARFUnitSectionBase &UnitSection,
39 const DWARFUnitIndex::Entry *IndexEntry)
40 : Context(DC), InfoSection(Section), Abbrev(DA), RangeSection(RS),
41 LineSection(LS), StringSection(SS), StringOffsetSection([&]() {
42 if (IndexEntry)
43 if (const auto *C = IndexEntry->getOffset(DW_SECT_STR_OFFSETS))
44 return SOS.slice(C->Offset, C->Offset + C->Length);
45 return SOS;
46 }()),
47 AddrOffsetSection(AOS), isLittleEndian(LE), isDWO(IsDWO),
48 UnitSection(UnitSection), IndexEntry(IndexEntry) {
49 clear();
50 }
51
~DWARFUnit()52 DWARFUnit::~DWARFUnit() {
53 }
54
getAddrOffsetSectionItem(uint32_t Index,uint64_t & Result) const55 bool DWARFUnit::getAddrOffsetSectionItem(uint32_t Index,
56 uint64_t &Result) const {
57 uint32_t Offset = AddrOffsetSectionBase + Index * AddrSize;
58 if (AddrOffsetSection.size() < Offset + AddrSize)
59 return false;
60 DataExtractor DA(AddrOffsetSection, isLittleEndian, AddrSize);
61 Result = DA.getAddress(&Offset);
62 return true;
63 }
64
getStringOffsetSectionItem(uint32_t Index,uint32_t & Result) const65 bool DWARFUnit::getStringOffsetSectionItem(uint32_t Index,
66 uint32_t &Result) const {
67 // FIXME: string offset section entries are 8-byte for DWARF64.
68 const uint32_t ItemSize = 4;
69 uint32_t Offset = Index * ItemSize;
70 if (StringOffsetSection.size() < Offset + ItemSize)
71 return false;
72 DataExtractor DA(StringOffsetSection, isLittleEndian, 0);
73 Result = DA.getU32(&Offset);
74 return true;
75 }
76
extractImpl(DataExtractor debug_info,uint32_t * offset_ptr)77 bool DWARFUnit::extractImpl(DataExtractor debug_info, uint32_t *offset_ptr) {
78 Length = debug_info.getU32(offset_ptr);
79 Version = debug_info.getU16(offset_ptr);
80 uint64_t AbbrOffset = debug_info.getU32(offset_ptr);
81 if (IndexEntry) {
82 if (AbbrOffset)
83 return false;
84 auto *UnitContrib = IndexEntry->getOffset();
85 if (!UnitContrib || UnitContrib->Length != (Length + 4))
86 return false;
87 auto *AbbrEntry = IndexEntry->getOffset(DW_SECT_ABBREV);
88 if (!AbbrEntry)
89 return false;
90 AbbrOffset = AbbrEntry->Offset;
91 }
92 AddrSize = debug_info.getU8(offset_ptr);
93
94 bool LengthOK = debug_info.isValidOffset(getNextUnitOffset() - 1);
95 bool VersionOK = DWARFContext::isSupportedVersion(Version);
96 bool AddrSizeOK = AddrSize == 4 || AddrSize == 8;
97
98 if (!LengthOK || !VersionOK || !AddrSizeOK)
99 return false;
100
101 Abbrevs = Abbrev->getAbbreviationDeclarationSet(AbbrOffset);
102 return Abbrevs != nullptr;
103 }
104
extract(DataExtractor debug_info,uint32_t * offset_ptr)105 bool DWARFUnit::extract(DataExtractor debug_info, uint32_t *offset_ptr) {
106 clear();
107
108 Offset = *offset_ptr;
109
110 if (debug_info.isValidOffset(*offset_ptr)) {
111 if (extractImpl(debug_info, offset_ptr))
112 return true;
113
114 // reset the offset to where we tried to parse from if anything went wrong
115 *offset_ptr = Offset;
116 }
117
118 return false;
119 }
120
extractRangeList(uint32_t RangeListOffset,DWARFDebugRangeList & RangeList) const121 bool DWARFUnit::extractRangeList(uint32_t RangeListOffset,
122 DWARFDebugRangeList &RangeList) const {
123 // Require that compile unit is extracted.
124 assert(DieArray.size() > 0);
125 DataExtractor RangesData(RangeSection, isLittleEndian, AddrSize);
126 uint32_t ActualRangeListOffset = RangeSectionBase + RangeListOffset;
127 return RangeList.extract(RangesData, &ActualRangeListOffset);
128 }
129
clear()130 void DWARFUnit::clear() {
131 Offset = 0;
132 Length = 0;
133 Version = 0;
134 Abbrevs = nullptr;
135 AddrSize = 0;
136 BaseAddr = 0;
137 RangeSectionBase = 0;
138 AddrOffsetSectionBase = 0;
139 clearDIEs(false);
140 DWO.reset();
141 }
142
getCompilationDir()143 const char *DWARFUnit::getCompilationDir() {
144 extractDIEsIfNeeded(true);
145 if (DieArray.empty())
146 return nullptr;
147 return DieArray[0].getAttributeValueAsString(this, DW_AT_comp_dir, nullptr);
148 }
149
getDWOId()150 uint64_t DWARFUnit::getDWOId() {
151 extractDIEsIfNeeded(true);
152 const uint64_t FailValue = -1ULL;
153 if (DieArray.empty())
154 return FailValue;
155 return DieArray[0]
156 .getAttributeValueAsUnsignedConstant(this, DW_AT_GNU_dwo_id, FailValue);
157 }
158
setDIERelations()159 void DWARFUnit::setDIERelations() {
160 if (DieArray.size() <= 1)
161 return;
162
163 std::vector<DWARFDebugInfoEntryMinimal *> ParentChain;
164 DWARFDebugInfoEntryMinimal *SiblingChain = nullptr;
165 for (auto &DIE : DieArray) {
166 if (SiblingChain) {
167 SiblingChain->setSibling(&DIE);
168 }
169 if (const DWARFAbbreviationDeclaration *AbbrDecl =
170 DIE.getAbbreviationDeclarationPtr()) {
171 // Normal DIE.
172 if (AbbrDecl->hasChildren()) {
173 ParentChain.push_back(&DIE);
174 SiblingChain = nullptr;
175 } else {
176 SiblingChain = &DIE;
177 }
178 } else {
179 // NULL entry terminates the sibling chain.
180 SiblingChain = ParentChain.back();
181 ParentChain.pop_back();
182 }
183 }
184 assert(SiblingChain == nullptr || SiblingChain == &DieArray[0]);
185 assert(ParentChain.empty());
186 }
187
extractDIEsToVector(bool AppendCUDie,bool AppendNonCUDies,std::vector<DWARFDebugInfoEntryMinimal> & Dies) const188 void DWARFUnit::extractDIEsToVector(
189 bool AppendCUDie, bool AppendNonCUDies,
190 std::vector<DWARFDebugInfoEntryMinimal> &Dies) const {
191 if (!AppendCUDie && !AppendNonCUDies)
192 return;
193
194 // Set the offset to that of the first DIE and calculate the start of the
195 // next compilation unit header.
196 uint32_t DIEOffset = Offset + getHeaderSize();
197 uint32_t NextCUOffset = getNextUnitOffset();
198 DWARFDebugInfoEntryMinimal DIE;
199 uint32_t Depth = 0;
200 bool IsCUDie = true;
201
202 while (DIEOffset < NextCUOffset && DIE.extractFast(this, &DIEOffset)) {
203 if (IsCUDie) {
204 if (AppendCUDie)
205 Dies.push_back(DIE);
206 if (!AppendNonCUDies)
207 break;
208 // The average bytes per DIE entry has been seen to be
209 // around 14-20 so let's pre-reserve the needed memory for
210 // our DIE entries accordingly.
211 Dies.reserve(Dies.size() + getDebugInfoSize() / 14);
212 IsCUDie = false;
213 } else {
214 Dies.push_back(DIE);
215 }
216
217 if (const DWARFAbbreviationDeclaration *AbbrDecl =
218 DIE.getAbbreviationDeclarationPtr()) {
219 // Normal DIE
220 if (AbbrDecl->hasChildren())
221 ++Depth;
222 } else {
223 // NULL DIE.
224 if (Depth > 0)
225 --Depth;
226 if (Depth == 0)
227 break; // We are done with this compile unit!
228 }
229 }
230
231 // Give a little bit of info if we encounter corrupt DWARF (our offset
232 // should always terminate at or before the start of the next compilation
233 // unit header).
234 if (DIEOffset > NextCUOffset)
235 fprintf(stderr, "warning: DWARF compile unit extends beyond its "
236 "bounds cu 0x%8.8x at 0x%8.8x'\n", getOffset(), DIEOffset);
237 }
238
extractDIEsIfNeeded(bool CUDieOnly)239 size_t DWARFUnit::extractDIEsIfNeeded(bool CUDieOnly) {
240 if ((CUDieOnly && DieArray.size() > 0) ||
241 DieArray.size() > 1)
242 return 0; // Already parsed.
243
244 bool HasCUDie = DieArray.size() > 0;
245 extractDIEsToVector(!HasCUDie, !CUDieOnly, DieArray);
246
247 if (DieArray.empty())
248 return 0;
249
250 // If CU DIE was just parsed, copy several attribute values from it.
251 if (!HasCUDie) {
252 uint64_t BaseAddr =
253 DieArray[0].getAttributeValueAsAddress(this, DW_AT_low_pc, -1ULL);
254 if (BaseAddr == -1ULL)
255 BaseAddr = DieArray[0].getAttributeValueAsAddress(this, DW_AT_entry_pc, 0);
256 setBaseAddress(BaseAddr);
257 AddrOffsetSectionBase = DieArray[0].getAttributeValueAsSectionOffset(
258 this, DW_AT_GNU_addr_base, 0);
259 RangeSectionBase = DieArray[0].getAttributeValueAsSectionOffset(
260 this, DW_AT_ranges_base, 0);
261 // Don't fall back to DW_AT_GNU_ranges_base: it should be ignored for
262 // skeleton CU DIE, so that DWARF users not aware of it are not broken.
263 }
264
265 setDIERelations();
266 return DieArray.size();
267 }
268
DWOHolder(StringRef DWOPath)269 DWARFUnit::DWOHolder::DWOHolder(StringRef DWOPath)
270 : DWOFile(), DWOContext(), DWOU(nullptr) {
271 auto Obj = object::ObjectFile::createObjectFile(DWOPath);
272 if (!Obj) {
273 // TODO: Actually report errors helpfully.
274 consumeError(Obj.takeError());
275 return;
276 }
277 DWOFile = std::move(Obj.get());
278 DWOContext.reset(
279 cast<DWARFContext>(new DWARFContextInMemory(*DWOFile.getBinary())));
280 if (DWOContext->getNumDWOCompileUnits() > 0)
281 DWOU = DWOContext->getDWOCompileUnitAtIndex(0);
282 }
283
parseDWO()284 bool DWARFUnit::parseDWO() {
285 if (isDWO)
286 return false;
287 if (DWO.get())
288 return false;
289 extractDIEsIfNeeded(true);
290 if (DieArray.empty())
291 return false;
292 const char *DWOFileName =
293 DieArray[0].getAttributeValueAsString(this, DW_AT_GNU_dwo_name, nullptr);
294 if (!DWOFileName)
295 return false;
296 const char *CompilationDir =
297 DieArray[0].getAttributeValueAsString(this, DW_AT_comp_dir, nullptr);
298 SmallString<16> AbsolutePath;
299 if (sys::path::is_relative(DWOFileName) && CompilationDir != nullptr) {
300 sys::path::append(AbsolutePath, CompilationDir);
301 }
302 sys::path::append(AbsolutePath, DWOFileName);
303 DWO = llvm::make_unique<DWOHolder>(AbsolutePath);
304 DWARFUnit *DWOCU = DWO->getUnit();
305 // Verify that compile unit in .dwo file is valid.
306 if (!DWOCU || DWOCU->getDWOId() != getDWOId()) {
307 DWO.reset();
308 return false;
309 }
310 // Share .debug_addr and .debug_ranges section with compile unit in .dwo
311 DWOCU->setAddrOffsetSection(AddrOffsetSection, AddrOffsetSectionBase);
312 uint32_t DWORangesBase = DieArray[0].getRangesBaseAttribute(this, 0);
313 DWOCU->setRangesSection(RangeSection, DWORangesBase);
314 return true;
315 }
316
clearDIEs(bool KeepCUDie)317 void DWARFUnit::clearDIEs(bool KeepCUDie) {
318 if (DieArray.size() > (unsigned)KeepCUDie) {
319 // std::vectors never get any smaller when resized to a smaller size,
320 // or when clear() or erase() are called, the size will report that it
321 // is smaller, but the memory allocated remains intact (call capacity()
322 // to see this). So we need to create a temporary vector and swap the
323 // contents which will cause just the internal pointers to be swapped
324 // so that when temporary vector goes out of scope, it will destroy the
325 // contents.
326 std::vector<DWARFDebugInfoEntryMinimal> TmpArray;
327 DieArray.swap(TmpArray);
328 // Save at least the compile unit DIE
329 if (KeepCUDie)
330 DieArray.push_back(TmpArray.front());
331 }
332 }
333
collectAddressRanges(DWARFAddressRangesVector & CURanges)334 void DWARFUnit::collectAddressRanges(DWARFAddressRangesVector &CURanges) {
335 const auto *U = getUnitDIE();
336 if (U == nullptr)
337 return;
338 // First, check if unit DIE describes address ranges for the whole unit.
339 const auto &CUDIERanges = U->getAddressRanges(this);
340 if (!CUDIERanges.empty()) {
341 CURanges.insert(CURanges.end(), CUDIERanges.begin(), CUDIERanges.end());
342 return;
343 }
344
345 // This function is usually called if there in no .debug_aranges section
346 // in order to produce a compile unit level set of address ranges that
347 // is accurate. If the DIEs weren't parsed, then we don't want all dies for
348 // all compile units to stay loaded when they weren't needed. So we can end
349 // up parsing the DWARF and then throwing them all away to keep memory usage
350 // down.
351 const bool ClearDIEs = extractDIEsIfNeeded(false) > 1;
352 DieArray[0].collectChildrenAddressRanges(this, CURanges);
353
354 // Collect address ranges from DIEs in .dwo if necessary.
355 bool DWOCreated = parseDWO();
356 if (DWO.get())
357 DWO->getUnit()->collectAddressRanges(CURanges);
358 if (DWOCreated)
359 DWO.reset();
360
361 // Keep memory down by clearing DIEs if this generate function
362 // caused them to be parsed.
363 if (ClearDIEs)
364 clearDIEs(true);
365 }
366
367 const DWARFDebugInfoEntryMinimal *
getSubprogramForAddress(uint64_t Address)368 DWARFUnit::getSubprogramForAddress(uint64_t Address) {
369 extractDIEsIfNeeded(false);
370 for (const DWARFDebugInfoEntryMinimal &DIE : DieArray) {
371 if (DIE.isSubprogramDIE() &&
372 DIE.addressRangeContainsAddress(this, Address)) {
373 return &DIE;
374 }
375 }
376 return nullptr;
377 }
378
379 DWARFDebugInfoEntryInlinedChain
getInlinedChainForAddress(uint64_t Address)380 DWARFUnit::getInlinedChainForAddress(uint64_t Address) {
381 // First, find a subprogram that contains the given address (the root
382 // of inlined chain).
383 const DWARFUnit *ChainCU = nullptr;
384 const DWARFDebugInfoEntryMinimal *SubprogramDIE;
385 // Try to look for subprogram DIEs in the DWO file.
386 parseDWO();
387 if (DWO) {
388 if ((SubprogramDIE = DWO->getUnit()->getSubprogramForAddress(Address)))
389 ChainCU = DWO->getUnit();
390 } else if ((SubprogramDIE = getSubprogramForAddress(Address)))
391 ChainCU = this;
392
393 // Get inlined chain rooted at this subprogram DIE.
394 if (!SubprogramDIE)
395 return DWARFDebugInfoEntryInlinedChain();
396 return SubprogramDIE->getInlinedChainForAddress(ChainCU, Address);
397 }
398
getDWARFUnitIndex(DWARFContext & Context,DWARFSectionKind Kind)399 const DWARFUnitIndex &getDWARFUnitIndex(DWARFContext &Context,
400 DWARFSectionKind Kind) {
401 if (Kind == DW_SECT_INFO)
402 return Context.getCUIndex();
403 assert(Kind == DW_SECT_TYPES);
404 return Context.getTUIndex();
405 }
406 }
407