[Alignment][NFC] Migrate Instructions to Align
[llvm-core.git] / include / llvm / DebugInfo / DWARF / DWARFAcceleratorTable.h
blobc9042e5932606b28308092e506e730ebb03836b5
1 //===- DWARFAcceleratorTable.h ----------------------------------*- C++ -*-===//
2 //
3 // Part of the LLVM Project, under the Apache License v2.0 with LLVM Exceptions.
4 // See https://llvm.org/LICENSE.txt for license information.
5 // SPDX-License-Identifier: Apache-2.0 WITH LLVM-exception
6 //
7 //===----------------------------------------------------------------------===//
9 #ifndef LLVM_DEBUGINFO_DWARFACCELERATORTABLE_H
10 #define LLVM_DEBUGINFO_DWARFACCELERATORTABLE_H
12 #include "llvm/ADT/DenseSet.h"
13 #include "llvm/ADT/SmallVector.h"
14 #include "llvm/BinaryFormat/Dwarf.h"
15 #include "llvm/DebugInfo/DWARF/DWARFDataExtractor.h"
16 #include "llvm/DebugInfo/DWARF/DWARFFormValue.h"
17 #include <cstdint>
18 #include <utility>
20 namespace llvm {
22 class raw_ostream;
23 class ScopedPrinter;
25 /// The accelerator tables are designed to allow efficient random access
26 /// (using a symbol name as a key) into debug info by providing an index of the
27 /// debug info DIEs. This class implements the common functionality of Apple and
28 /// DWARF 5 accelerator tables.
29 /// TODO: Generalize the rest of the AppleAcceleratorTable interface and move it
30 /// to this class.
31 class DWARFAcceleratorTable {
32 protected:
33 DWARFDataExtractor AccelSection;
34 DataExtractor StringSection;
36 public:
37 /// An abstract class representing a single entry in the accelerator tables.
38 class Entry {
39 protected:
40 SmallVector<DWARFFormValue, 3> Values;
42 Entry() = default;
44 // Make these protected so only (final) subclasses can be copied around.
45 Entry(const Entry &) = default;
46 Entry(Entry &&) = default;
47 Entry &operator=(const Entry &) = default;
48 Entry &operator=(Entry &&) = default;
49 ~Entry() = default;
52 public:
53 /// Returns the Offset of the Compilation Unit associated with this
54 /// Accelerator Entry or None if the Compilation Unit offset is not recorded
55 /// in this Accelerator Entry.
56 virtual Optional<uint64_t> getCUOffset() const = 0;
58 /// Returns the Tag of the Debug Info Entry associated with this
59 /// Accelerator Entry or None if the Tag is not recorded in this
60 /// Accelerator Entry.
61 virtual Optional<dwarf::Tag> getTag() const = 0;
63 /// Returns the raw values of fields in the Accelerator Entry. In general,
64 /// these can only be interpreted with the help of the metadata in the
65 /// owning Accelerator Table.
66 ArrayRef<DWARFFormValue> getValues() const { return Values; }
69 DWARFAcceleratorTable(const DWARFDataExtractor &AccelSection,
70 DataExtractor StringSection)
71 : AccelSection(AccelSection), StringSection(StringSection) {}
72 virtual ~DWARFAcceleratorTable();
74 virtual Error extract() = 0;
75 virtual void dump(raw_ostream &OS) const = 0;
77 DWARFAcceleratorTable(const DWARFAcceleratorTable &) = delete;
78 void operator=(const DWARFAcceleratorTable &) = delete;
81 /// This implements the Apple accelerator table format, a precursor of the
82 /// DWARF 5 accelerator table format.
83 class AppleAcceleratorTable : public DWARFAcceleratorTable {
84 struct Header {
85 uint32_t Magic;
86 uint16_t Version;
87 uint16_t HashFunction;
88 uint32_t BucketCount;
89 uint32_t HashCount;
90 uint32_t HeaderDataLength;
92 void dump(ScopedPrinter &W) const;
95 struct HeaderData {
96 using AtomType = uint16_t;
97 using Form = dwarf::Form;
99 uint64_t DIEOffsetBase;
100 SmallVector<std::pair<AtomType, Form>, 3> Atoms;
102 Optional<uint64_t> extractOffset(Optional<DWARFFormValue> Value) const;
105 struct Header Hdr;
106 struct HeaderData HdrData;
107 bool IsValid = false;
109 /// Returns true if we should continue scanning for entries or false if we've
110 /// reached the last (sentinel) entry of encountered a parsing error.
111 bool dumpName(ScopedPrinter &W, SmallVectorImpl<DWARFFormValue> &AtomForms,
112 uint64_t *DataOffset) const;
114 public:
115 /// Apple-specific implementation of an Accelerator Entry.
116 class Entry final : public DWARFAcceleratorTable::Entry {
117 const HeaderData *HdrData = nullptr;
119 Entry(const HeaderData &Data);
120 Entry() = default;
122 void extract(const AppleAcceleratorTable &AccelTable, uint64_t *Offset);
124 public:
125 Optional<uint64_t> getCUOffset() const override;
127 /// Returns the Section Offset of the Debug Info Entry associated with this
128 /// Accelerator Entry or None if the DIE offset is not recorded in this
129 /// Accelerator Entry. The returned offset is relative to the start of the
130 /// Section containing the DIE.
131 Optional<uint64_t> getDIESectionOffset() const;
133 Optional<dwarf::Tag> getTag() const override;
135 /// Returns the value of the Atom in this Accelerator Entry, if the Entry
136 /// contains such Atom.
137 Optional<DWARFFormValue> lookup(HeaderData::AtomType Atom) const;
139 friend class AppleAcceleratorTable;
140 friend class ValueIterator;
143 class ValueIterator : public std::iterator<std::input_iterator_tag, Entry> {
144 const AppleAcceleratorTable *AccelTable = nullptr;
145 Entry Current; ///< The current entry.
146 uint64_t DataOffset = 0; ///< Offset into the section.
147 unsigned Data = 0; ///< Current data entry.
148 unsigned NumData = 0; ///< Number of data entries.
150 /// Advance the iterator.
151 void Next();
152 public:
153 /// Construct a new iterator for the entries at \p DataOffset.
154 ValueIterator(const AppleAcceleratorTable &AccelTable, uint64_t DataOffset);
155 /// End marker.
156 ValueIterator() = default;
158 const Entry &operator*() const { return Current; }
159 ValueIterator &operator++() { Next(); return *this; }
160 ValueIterator operator++(int) {
161 ValueIterator I = *this;
162 Next();
163 return I;
165 friend bool operator==(const ValueIterator &A, const ValueIterator &B) {
166 return A.NumData == B.NumData && A.DataOffset == B.DataOffset;
168 friend bool operator!=(const ValueIterator &A, const ValueIterator &B) {
169 return !(A == B);
173 AppleAcceleratorTable(const DWARFDataExtractor &AccelSection,
174 DataExtractor StringSection)
175 : DWARFAcceleratorTable(AccelSection, StringSection) {}
177 Error extract() override;
178 uint32_t getNumBuckets();
179 uint32_t getNumHashes();
180 uint32_t getSizeHdr();
181 uint32_t getHeaderDataLength();
183 /// Return the Atom description, which can be used to interpret the raw values
184 /// of the Accelerator Entries in this table.
185 ArrayRef<std::pair<HeaderData::AtomType, HeaderData::Form>> getAtomsDesc();
186 bool validateForms();
188 /// Return information related to the DWARF DIE we're looking for when
189 /// performing a lookup by name.
191 /// \param HashDataOffset an offset into the hash data table
192 /// \returns <DieOffset, DieTag>
193 /// DieOffset is the offset into the .debug_info section for the DIE
194 /// related to the input hash data offset.
195 /// DieTag is the tag of the DIE
196 std::pair<uint64_t, dwarf::Tag> readAtoms(uint64_t *HashDataOffset);
197 void dump(raw_ostream &OS) const override;
199 /// Look up all entries in the accelerator table matching \c Key.
200 iterator_range<ValueIterator> equal_range(StringRef Key) const;
203 /// .debug_names section consists of one or more units. Each unit starts with a
204 /// header, which is followed by a list of compilation units, local and foreign
205 /// type units.
207 /// These may be followed by an (optional) hash lookup table, which consists of
208 /// an array of buckets and hashes similar to the apple tables above. The only
209 /// difference is that the hashes array is 1-based, and consequently an empty
210 /// bucket is denoted by 0 and not UINT32_MAX.
212 /// Next is the name table, which consists of an array of names and array of
213 /// entry offsets. This is different from the apple tables, which store names
214 /// next to the actual entries.
216 /// The structure of the entries is described by an abbreviations table, which
217 /// comes after the name table. Unlike the apple tables, which have a uniform
218 /// entry structure described in the header, each .debug_names entry may have
219 /// different index attributes (DW_IDX_???) attached to it.
221 /// The last segment consists of a list of entries, which is a 0-terminated list
222 /// referenced by the name table and interpreted with the help of the
223 /// abbreviation table.
224 class DWARFDebugNames : public DWARFAcceleratorTable {
225 /// The fixed-size part of a DWARF v5 Name Index header
226 struct HeaderPOD {
227 uint32_t UnitLength;
228 uint16_t Version;
229 uint16_t Padding;
230 uint32_t CompUnitCount;
231 uint32_t LocalTypeUnitCount;
232 uint32_t ForeignTypeUnitCount;
233 uint32_t BucketCount;
234 uint32_t NameCount;
235 uint32_t AbbrevTableSize;
236 uint32_t AugmentationStringSize;
239 public:
240 class NameIndex;
241 class NameIterator;
242 class ValueIterator;
244 /// DWARF v5 Name Index header.
245 struct Header : public HeaderPOD {
246 SmallString<8> AugmentationString;
248 Error extract(const DWARFDataExtractor &AS, uint64_t *Offset);
249 void dump(ScopedPrinter &W) const;
252 /// Index attribute and its encoding.
253 struct AttributeEncoding {
254 dwarf::Index Index;
255 dwarf::Form Form;
257 constexpr AttributeEncoding(dwarf::Index Index, dwarf::Form Form)
258 : Index(Index), Form(Form) {}
260 friend bool operator==(const AttributeEncoding &LHS,
261 const AttributeEncoding &RHS) {
262 return LHS.Index == RHS.Index && LHS.Form == RHS.Form;
266 /// Abbreviation describing the encoding of Name Index entries.
267 struct Abbrev {
268 uint32_t Code; ///< Abbreviation code
269 dwarf::Tag Tag; ///< Dwarf Tag of the described entity.
270 std::vector<AttributeEncoding> Attributes; ///< List of index attributes.
272 Abbrev(uint32_t Code, dwarf::Tag Tag,
273 std::vector<AttributeEncoding> Attributes)
274 : Code(Code), Tag(Tag), Attributes(std::move(Attributes)) {}
276 void dump(ScopedPrinter &W) const;
279 /// DWARF v5-specific implementation of an Accelerator Entry.
280 class Entry final : public DWARFAcceleratorTable::Entry {
281 const NameIndex *NameIdx;
282 const Abbrev *Abbr;
284 Entry(const NameIndex &NameIdx, const Abbrev &Abbr);
286 public:
287 Optional<uint64_t> getCUOffset() const override;
288 Optional<dwarf::Tag> getTag() const override { return tag(); }
290 /// Returns the Index into the Compilation Unit list of the owning Name
291 /// Index or None if this Accelerator Entry does not have an associated
292 /// Compilation Unit. It is up to the user to verify that the returned Index
293 /// is valid in the owning NameIndex (or use getCUOffset(), which will
294 /// handle that check itself). Note that entries in NameIndexes which index
295 /// just a single Compilation Unit are implicitly associated with that unit,
296 /// so this function will return 0 even without an explicit
297 /// DW_IDX_compile_unit attribute.
298 Optional<uint64_t> getCUIndex() const;
300 /// .debug_names-specific getter, which always succeeds (DWARF v5 index
301 /// entries always have a tag).
302 dwarf::Tag tag() const { return Abbr->Tag; }
304 /// Returns the Offset of the DIE within the containing CU or TU.
305 Optional<uint64_t> getDIEUnitOffset() const;
307 /// Return the Abbreviation that can be used to interpret the raw values of
308 /// this Accelerator Entry.
309 const Abbrev &getAbbrev() const { return *Abbr; }
311 /// Returns the value of the Index Attribute in this Accelerator Entry, if
312 /// the Entry contains such Attribute.
313 Optional<DWARFFormValue> lookup(dwarf::Index Index) const;
315 void dump(ScopedPrinter &W) const;
317 friend class NameIndex;
318 friend class ValueIterator;
321 /// Error returned by NameIndex::getEntry to report it has reached the end of
322 /// the entry list.
323 class SentinelError : public ErrorInfo<SentinelError> {
324 public:
325 static char ID;
327 void log(raw_ostream &OS) const override { OS << "Sentinel"; }
328 std::error_code convertToErrorCode() const override;
331 private:
332 /// DenseMapInfo for struct Abbrev.
333 struct AbbrevMapInfo {
334 static Abbrev getEmptyKey();
335 static Abbrev getTombstoneKey();
336 static unsigned getHashValue(uint32_t Code) {
337 return DenseMapInfo<uint32_t>::getHashValue(Code);
339 static unsigned getHashValue(const Abbrev &Abbr) {
340 return getHashValue(Abbr.Code);
342 static bool isEqual(uint32_t LHS, const Abbrev &RHS) {
343 return LHS == RHS.Code;
345 static bool isEqual(const Abbrev &LHS, const Abbrev &RHS) {
346 return LHS.Code == RHS.Code;
350 public:
351 /// A single entry in the Name Table (DWARF v5 sect. 6.1.1.4.6) of the Name
352 /// Index.
353 class NameTableEntry {
354 DataExtractor StrData;
356 uint32_t Index;
357 uint64_t StringOffset;
358 uint64_t EntryOffset;
360 public:
361 NameTableEntry(const DataExtractor &StrData, uint32_t Index,
362 uint64_t StringOffset, uint64_t EntryOffset)
363 : StrData(StrData), Index(Index), StringOffset(StringOffset),
364 EntryOffset(EntryOffset) {}
366 /// Return the index of this name in the parent Name Index.
367 uint32_t getIndex() const { return Index; }
369 /// Returns the offset of the name of the described entities.
370 uint64_t getStringOffset() const { return StringOffset; }
372 /// Return the string referenced by this name table entry or nullptr if the
373 /// string offset is not valid.
374 const char *getString() const {
375 uint64_t Off = StringOffset;
376 return StrData.getCStr(&Off);
379 /// Returns the offset of the first Entry in the list.
380 uint64_t getEntryOffset() const { return EntryOffset; }
383 /// Represents a single accelerator table within the DWARF v5 .debug_names
384 /// section.
385 class NameIndex {
386 DenseSet<Abbrev, AbbrevMapInfo> Abbrevs;
387 struct Header Hdr;
388 const DWARFDebugNames &Section;
390 // Base of the whole unit and of various important tables, as offsets from
391 // the start of the section.
392 uint64_t Base;
393 uint64_t CUsBase;
394 uint64_t BucketsBase;
395 uint64_t HashesBase;
396 uint64_t StringOffsetsBase;
397 uint64_t EntryOffsetsBase;
398 uint64_t EntriesBase;
400 void dumpCUs(ScopedPrinter &W) const;
401 void dumpLocalTUs(ScopedPrinter &W) const;
402 void dumpForeignTUs(ScopedPrinter &W) const;
403 void dumpAbbreviations(ScopedPrinter &W) const;
404 bool dumpEntry(ScopedPrinter &W, uint64_t *Offset) const;
405 void dumpName(ScopedPrinter &W, const NameTableEntry &NTE,
406 Optional<uint32_t> Hash) const;
407 void dumpBucket(ScopedPrinter &W, uint32_t Bucket) const;
409 Expected<AttributeEncoding> extractAttributeEncoding(uint64_t *Offset);
411 Expected<std::vector<AttributeEncoding>>
412 extractAttributeEncodings(uint64_t *Offset);
414 Expected<Abbrev> extractAbbrev(uint64_t *Offset);
416 public:
417 NameIndex(const DWARFDebugNames &Section, uint64_t Base)
418 : Section(Section), Base(Base) {}
420 /// Reads offset of compilation unit CU. CU is 0-based.
421 uint64_t getCUOffset(uint32_t CU) const;
422 uint32_t getCUCount() const { return Hdr.CompUnitCount; }
424 /// Reads offset of local type unit TU, TU is 0-based.
425 uint64_t getLocalTUOffset(uint32_t TU) const;
426 uint32_t getLocalTUCount() const { return Hdr.LocalTypeUnitCount; }
428 /// Reads signature of foreign type unit TU. TU is 0-based.
429 uint64_t getForeignTUSignature(uint32_t TU) const;
430 uint32_t getForeignTUCount() const { return Hdr.ForeignTypeUnitCount; }
432 /// Reads an entry in the Bucket Array for the given Bucket. The returned
433 /// value is a (1-based) index into the Names, StringOffsets and
434 /// EntryOffsets arrays. The input Bucket index is 0-based.
435 uint32_t getBucketArrayEntry(uint32_t Bucket) const;
436 uint32_t getBucketCount() const { return Hdr.BucketCount; }
438 /// Reads an entry in the Hash Array for the given Index. The input Index
439 /// is 1-based.
440 uint32_t getHashArrayEntry(uint32_t Index) const;
442 /// Reads an entry in the Name Table for the given Index. The Name Table
443 /// consists of two arrays -- String Offsets and Entry Offsets. The returned
444 /// offsets are relative to the starts of respective sections. Input Index
445 /// is 1-based.
446 NameTableEntry getNameTableEntry(uint32_t Index) const;
448 uint32_t getNameCount() const { return Hdr.NameCount; }
450 const DenseSet<Abbrev, AbbrevMapInfo> &getAbbrevs() const {
451 return Abbrevs;
454 Expected<Entry> getEntry(uint64_t *Offset) const;
456 /// Look up all entries in this Name Index matching \c Key.
457 iterator_range<ValueIterator> equal_range(StringRef Key) const;
459 NameIterator begin() const { return NameIterator(this, 1); }
460 NameIterator end() const { return NameIterator(this, getNameCount() + 1); }
462 Error extract();
463 uint64_t getUnitOffset() const { return Base; }
464 uint64_t getNextUnitOffset() const { return Base + 4 + Hdr.UnitLength; }
465 void dump(ScopedPrinter &W) const;
467 friend class DWARFDebugNames;
470 class ValueIterator : public std::iterator<std::input_iterator_tag, Entry> {
472 /// The Name Index we are currently iterating through. The implementation
473 /// relies on the fact that this can also be used as an iterator into the
474 /// "NameIndices" vector in the Accelerator section.
475 const NameIndex *CurrentIndex = nullptr;
477 /// Whether this is a local iterator (searches in CurrentIndex only) or not
478 /// (searches all name indices).
479 bool IsLocal;
481 Optional<Entry> CurrentEntry;
482 uint64_t DataOffset = 0; ///< Offset into the section.
483 std::string Key; ///< The Key we are searching for.
484 Optional<uint32_t> Hash; ///< Hash of Key, if it has been computed.
486 bool getEntryAtCurrentOffset();
487 Optional<uint64_t> findEntryOffsetInCurrentIndex();
488 bool findInCurrentIndex();
489 void searchFromStartOfCurrentIndex();
490 void next();
492 /// Set the iterator to the "end" state.
493 void setEnd() { *this = ValueIterator(); }
495 public:
496 /// Create a "begin" iterator for looping over all entries in the
497 /// accelerator table matching Key. The iterator will run through all Name
498 /// Indexes in the section in sequence.
499 ValueIterator(const DWARFDebugNames &AccelTable, StringRef Key);
501 /// Create a "begin" iterator for looping over all entries in a specific
502 /// Name Index. Other indices in the section will not be visited.
503 ValueIterator(const NameIndex &NI, StringRef Key);
505 /// End marker.
506 ValueIterator() = default;
508 const Entry &operator*() const { return *CurrentEntry; }
509 ValueIterator &operator++() {
510 next();
511 return *this;
513 ValueIterator operator++(int) {
514 ValueIterator I = *this;
515 next();
516 return I;
519 friend bool operator==(const ValueIterator &A, const ValueIterator &B) {
520 return A.CurrentIndex == B.CurrentIndex && A.DataOffset == B.DataOffset;
522 friend bool operator!=(const ValueIterator &A, const ValueIterator &B) {
523 return !(A == B);
527 class NameIterator {
529 /// The Name Index we are iterating through.
530 const NameIndex *CurrentIndex;
532 /// The current name in the Name Index.
533 uint32_t CurrentName;
535 void next() {
536 assert(CurrentName <= CurrentIndex->getNameCount());
537 ++CurrentName;
540 public:
541 using iterator_category = std::input_iterator_tag;
542 using value_type = NameTableEntry;
543 using difference_type = uint32_t;
544 using pointer = NameTableEntry *;
545 using reference = NameTableEntry; // We return entries by value.
547 /// Creates an iterator whose initial position is name CurrentName in
548 /// CurrentIndex.
549 NameIterator(const NameIndex *CurrentIndex, uint32_t CurrentName)
550 : CurrentIndex(CurrentIndex), CurrentName(CurrentName) {}
552 NameTableEntry operator*() const {
553 return CurrentIndex->getNameTableEntry(CurrentName);
555 NameIterator &operator++() {
556 next();
557 return *this;
559 NameIterator operator++(int) {
560 NameIterator I = *this;
561 next();
562 return I;
565 friend bool operator==(const NameIterator &A, const NameIterator &B) {
566 return A.CurrentIndex == B.CurrentIndex && A.CurrentName == B.CurrentName;
568 friend bool operator!=(const NameIterator &A, const NameIterator &B) {
569 return !(A == B);
573 private:
574 SmallVector<NameIndex, 0> NameIndices;
575 DenseMap<uint64_t, const NameIndex *> CUToNameIndex;
577 public:
578 DWARFDebugNames(const DWARFDataExtractor &AccelSection,
579 DataExtractor StringSection)
580 : DWARFAcceleratorTable(AccelSection, StringSection) {}
582 Error extract() override;
583 void dump(raw_ostream &OS) const override;
585 /// Look up all entries in the accelerator table matching \c Key.
586 iterator_range<ValueIterator> equal_range(StringRef Key) const;
588 using const_iterator = SmallVector<NameIndex, 0>::const_iterator;
589 const_iterator begin() const { return NameIndices.begin(); }
590 const_iterator end() const { return NameIndices.end(); }
592 /// Return the Name Index covering the compile unit at CUOffset, or nullptr if
593 /// there is no Name Index covering that unit.
594 const NameIndex *getCUNameIndex(uint64_t CUOffset);
597 } // end namespace llvm
599 #endif // LLVM_DEBUGINFO_DWARFACCELERATORTABLE_H