1 //==- include/llvm/CodeGen/AccelTable.h - Accelerator Tables -----*- C++ -*-==//
2 //
3 //                     The LLVM Compiler Infrastructure
4 //
5 // This file is distributed under the University of Illinois Open Source
6 // License. See LICENSE.TXT for details.
7 //
8 //===----------------------------------------------------------------------===//
9 //
10 // This file contains support for writing accelerator tables.
11 //
12 //===----------------------------------------------------------------------===//
13 
14 #ifndef LLVM_CODEGEN_DWARFACCELTABLE_H
15 #define LLVM_CODEGEN_DWARFACCELTABLE_H
16 
17 #include "llvm/ADT/ArrayRef.h"
18 #include "llvm/ADT/SmallVector.h"
19 #include "llvm/ADT/StringMap.h"
20 #include "llvm/ADT/StringRef.h"
21 #include "llvm/BinaryFormat/Dwarf.h"
22 #include "llvm/CodeGen/DIE.h"
23 #include "llvm/CodeGen/DwarfStringPoolEntry.h"
24 #include "llvm/MC/MCSymbol.h"
25 #include "llvm/Support/Allocator.h"
26 #include "llvm/Support/DJB.h"
27 #include "llvm/Support/Debug.h"
28 #include "llvm/Support/Format.h"
29 #include "llvm/Support/raw_ostream.h"
30 #include <cstddef>
31 #include <cstdint>
32 #include <vector>
33 
34 /// The DWARF and Apple accelerator tables are an indirect hash table optimized
35 /// for null lookup rather than access to known data. The Apple accelerator
36 /// tables are a precursor of the newer DWARF v5 accelerator tables. Both
37 /// formats share common design ideas.
38 ///
39 /// The Apple accelerator table are output into an on-disk format that looks
40 /// like this:
41 ///
42 /// .------------------.
43 /// |  HEADER          |
44 /// |------------------|
45 /// |  BUCKETS         |
46 /// |------------------|
47 /// |  HASHES          |
48 /// |------------------|
49 /// |  OFFSETS         |
50 /// |------------------|
51 /// |  DATA            |
52 /// `------------------'
53 ///
54 /// The header contains a magic number, version, type of hash function,
55 /// the number of buckets, total number of hashes, and room for a special struct
56 /// of data and the length of that struct.
57 ///
58 /// The buckets contain an index (e.g. 6) into the hashes array. The hashes
59 /// section contains all of the 32-bit hash values in contiguous memory, and the
60 /// offsets contain the offset into the data area for the particular hash.
61 ///
62 /// For a lookup example, we could hash a function name and take it modulo the
63 /// number of buckets giving us our bucket. From there we take the bucket value
64 /// as an index into the hashes table and look at each successive hash as long
65 /// as the hash value is still the same modulo result (bucket value) as earlier.
66 /// If we have a match we look at that same entry in the offsets table and grab
67 /// the offset in the data for our final match.
68 ///
69 /// The DWARF v5 accelerator table consists of zero or more name indices that
70 /// are output into an on-disk format that looks like this:
71 ///
72 /// .------------------.
73 /// |  HEADER          |
74 /// |------------------|
75 /// |  CU LIST         |
76 /// |------------------|
77 /// |  LOCAL TU LIST   |
78 /// |------------------|
79 /// |  FOREIGN TU LIST |
80 /// |------------------|
81 /// |  HASH TABLE      |
82 /// |------------------|
83 /// |  NAME TABLE      |
84 /// |------------------|
85 /// |  ABBREV TABLE    |
86 /// |------------------|
87 /// |  ENTRY POOL      |
88 /// `------------------'
89 ///
90 /// For the full documentation please refer to the DWARF 5 standard.
91 ///
92 ///
93 /// This file defines the class template AccelTable, which is represents an
94 /// abstract view of an Accelerator table, without any notion of an on-disk
95 /// layout. This class is parameterized by an entry type, which should derive
96 /// from AccelTableData. This is the type of individual entries in the table,
97 /// and it should store the data necessary to emit them. AppleAccelTableData is
98 /// the base class for Apple Accelerator Table entries, which have a uniform
99 /// structure based on a sequence of Atoms. There are different sub-classes
100 /// derived from AppleAccelTable, which differ in the set of Atoms and how they
101 /// obtain their values.
102 ///
103 /// An Apple Accelerator Table can be serialized by calling emitAppleAccelTable
104 /// function.
105 ///
106 /// TODO: Add DWARF v5 emission code.
107 
108 namespace llvm {
109 
110 class AsmPrinter;
111 class DwarfCompileUnit;
112 class DwarfDebug;
113 
114 /// Interface which the different types of accelerator table data have to
115 /// conform. It serves as a base class for different values of the template
116 /// argument of the AccelTable class template.
117 class AccelTableData {
118 public:
119   virtual ~AccelTableData() = default;
120 
121   bool operator<(const AccelTableData &Other) const {
122     return order() < Other.order();
123   }
124 
125     // Subclasses should implement:
126     // static uint32_t hash(StringRef Name);
127 
128 #ifndef NDEBUG
129   virtual void print(raw_ostream &OS) const = 0;
130 #endif
131 protected:
132   virtual uint64_t order() const = 0;
133 };
134 
135 /// A base class holding non-template-dependant functionality of the AccelTable
136 /// class. Clients should not use this class directly but rather instantiate
137 /// AccelTable with a type derived from AccelTableData.
138 class AccelTableBase {
139 public:
140   using HashFn = uint32_t(StringRef);
141 
142   /// Represents a group of entries with identical name (and hence, hash value).
143   struct HashData {
144     DwarfStringPoolEntryRef Name;
145     uint32_t HashValue;
146     std::vector<AccelTableData *> Values;
147     MCSymbol *Sym;
148 
HashDataHashData149     HashData(DwarfStringPoolEntryRef Name, HashFn *Hash)
150         : Name(Name), HashValue(Hash(Name.getString())) {}
151 
152 #ifndef NDEBUG
153     void print(raw_ostream &OS) const;
dumpHashData154     void dump() const { print(dbgs()); }
155 #endif
156   };
157   using HashList = std::vector<HashData *>;
158   using BucketList = std::vector<HashList>;
159 
160 protected:
161   /// Allocator for HashData and Values.
162   BumpPtrAllocator Allocator;
163 
164   using StringEntries = StringMap<HashData, BumpPtrAllocator &>;
165   StringEntries Entries;
166 
167   HashFn *Hash;
168   uint32_t BucketCount;
169   uint32_t UniqueHashCount;
170 
171   HashList Hashes;
172   BucketList Buckets;
173 
174   void computeBucketCount();
175 
AccelTableBase(HashFn * Hash)176   AccelTableBase(HashFn *Hash) : Entries(Allocator), Hash(Hash) {}
177 
178 public:
179   void finalize(AsmPrinter *Asm, StringRef Prefix);
getBuckets()180   ArrayRef<HashList> getBuckets() const { return Buckets; }
getBucketCount()181   uint32_t getBucketCount() const { return BucketCount; }
getUniqueHashCount()182   uint32_t getUniqueHashCount() const { return UniqueHashCount; }
getUniqueNameCount()183   uint32_t getUniqueNameCount() const { return Entries.size(); }
184 
185 #ifndef NDEBUG
186   void print(raw_ostream &OS) const;
dump()187   void dump() const { print(dbgs()); }
188 #endif
189 
190   AccelTableBase(const AccelTableBase &) = delete;
191   void operator=(const AccelTableBase &) = delete;
192 };
193 
194 /// This class holds an abstract representation of an Accelerator Table,
195 /// consisting of a sequence of buckets, each bucket containint a sequence of
196 /// HashData entries. The class is parameterized by the type of entries it
197 /// holds. The type template parameter also defines the hash function to use for
198 /// hashing names.
199 template <typename DataT> class AccelTable : public AccelTableBase {
200 public:
AccelTable()201   AccelTable() : AccelTableBase(DataT::hash) {}
202 
203   template <typename... Types>
204   void addName(DwarfStringPoolEntryRef Name, Types &&... Args);
205 };
206 
207 template <typename AccelTableDataT>
208 template <typename... Types>
addName(DwarfStringPoolEntryRef Name,Types &&...Args)209 void AccelTable<AccelTableDataT>::addName(DwarfStringPoolEntryRef Name,
210                                           Types &&... Args) {
211   assert(Buckets.empty() && "Already finalized!");
212   // If the string is in the list already then add this die to the list
213   // otherwise add a new one.
214   auto Iter = Entries.try_emplace(Name.getString(), Name, Hash).first;
215   assert(Iter->second.Name == Name);
216   Iter->second.Values.push_back(
217       new (Allocator) AccelTableDataT(std::forward<Types>(Args)...));
218 }
219 
220 /// A base class for different implementations of Data classes for Apple
221 /// Accelerator Tables. The columns in the table are defined by the static Atoms
222 /// variable defined on the subclasses.
223 class AppleAccelTableData : public AccelTableData {
224 public:
225   /// An Atom defines the form of the data in an Apple accelerator table.
226   /// Conceptually it is a column in the accelerator consisting of a type and a
227   /// specification of the form of its data.
228   struct Atom {
229     /// Atom Type.
230     const uint16_t Type;
231     /// DWARF Form.
232     const uint16_t Form;
233 
AtomAtom234     constexpr Atom(uint16_t Type, uint16_t Form) : Type(Type), Form(Form) {}
235 
236 #ifndef NDEBUG
237     void print(raw_ostream &OS) const;
dumpAtom238     void dump() const { print(dbgs()); }
239 #endif
240   };
241   // Subclasses should define:
242   // static constexpr Atom Atoms[];
243 
244   virtual void emit(AsmPrinter *Asm) const = 0;
245 
hash(StringRef Buffer)246   static uint32_t hash(StringRef Buffer) { return djbHash(Buffer); }
247 };
248 
249 /// The Data class implementation for DWARF v5 accelerator table. Unlike the
250 /// Apple Data classes, this class is just a DIE wrapper, and does not know to
251 /// serialize itself. The complete serialization logic is in the
252 /// emitDWARF5AccelTable function.
253 class DWARF5AccelTableData : public AccelTableData {
254 public:
hash(StringRef Name)255   static uint32_t hash(StringRef Name) { return caseFoldingDjbHash(Name); }
256 
DWARF5AccelTableData(const DIE & Die)257   DWARF5AccelTableData(const DIE &Die) : Die(Die) {}
258 
259 #ifndef NDEBUG
260   void print(raw_ostream &OS) const override;
261 #endif
262 
getDie()263   const DIE &getDie() const { return Die; }
getDieOffset()264   uint64_t getDieOffset() const { return Die.getOffset(); }
getDieTag()265   unsigned getDieTag() const { return Die.getTag(); }
266 
267 protected:
268   const DIE &Die;
269 
order()270   uint64_t order() const override { return Die.getOffset(); }
271 };
272 
273 class DWARF5AccelTableStaticData : public AccelTableData {
274 public:
hash(StringRef Name)275   static uint32_t hash(StringRef Name) { return caseFoldingDjbHash(Name); }
276 
DWARF5AccelTableStaticData(uint64_t DieOffset,unsigned DieTag,unsigned CUIndex)277   DWARF5AccelTableStaticData(uint64_t DieOffset, unsigned DieTag,
278                              unsigned CUIndex)
279       : DieOffset(DieOffset), DieTag(DieTag), CUIndex(CUIndex) {}
280 
281 #ifndef NDEBUG
282   void print(raw_ostream &OS) const override;
283 #endif
284 
getDieOffset()285   uint64_t getDieOffset() const { return DieOffset; }
getDieTag()286   unsigned getDieTag() const { return DieTag; }
getCUIndex()287   unsigned getCUIndex() const { return CUIndex; }
288 
289 protected:
290   uint64_t DieOffset;
291   unsigned DieTag;
292   unsigned CUIndex;
293 
order()294   uint64_t order() const override { return DieOffset; }
295 };
296 
297 void emitAppleAccelTableImpl(AsmPrinter *Asm, AccelTableBase &Contents,
298                              StringRef Prefix, const MCSymbol *SecBegin,
299                              ArrayRef<AppleAccelTableData::Atom> Atoms);
300 
301 /// Emit an Apple Accelerator Table consisting of entries in the specified
302 /// AccelTable. The DataT template parameter should be derived from
303 /// AppleAccelTableData.
304 template <typename DataT>
emitAppleAccelTable(AsmPrinter * Asm,AccelTable<DataT> & Contents,StringRef Prefix,const MCSymbol * SecBegin)305 void emitAppleAccelTable(AsmPrinter *Asm, AccelTable<DataT> &Contents,
306                          StringRef Prefix, const MCSymbol *SecBegin) {
307   static_assert(std::is_convertible<DataT *, AppleAccelTableData *>::value, "");
308   emitAppleAccelTableImpl(Asm, Contents, Prefix, SecBegin, DataT::Atoms);
309 }
310 
311 void emitDWARF5AccelTable(AsmPrinter *Asm,
312                           AccelTable<DWARF5AccelTableData> &Contents,
313                           const DwarfDebug &DD,
314                           ArrayRef<std::unique_ptr<DwarfCompileUnit>> CUs);
315 
316 void emitDWARF5AccelTable(
317     AsmPrinter *Asm, AccelTable<DWARF5AccelTableStaticData> &Contents,
318     ArrayRef<MCSymbol *> CUs,
319     llvm::function_ref<unsigned(const DWARF5AccelTableStaticData &)>
320         getCUIndexForEntry);
321 
322 /// Accelerator table data implementation for simple Apple accelerator tables
323 /// with just a DIE reference.
324 class AppleAccelTableOffsetData : public AppleAccelTableData {
325 public:
AppleAccelTableOffsetData(const DIE & D)326   AppleAccelTableOffsetData(const DIE &D) : Die(D) {}
327 
328   void emit(AsmPrinter *Asm) const override;
329 
330 #ifndef _MSC_VER
331   // The line below is rejected by older versions (TBD) of MSVC.
332   static constexpr Atom Atoms[] = {
333       Atom(dwarf::DW_ATOM_die_offset, dwarf::DW_FORM_data4)};
334 #else
335   // FIXME: Erase this path once the minimum MSCV version has been bumped.
336   static const SmallVector<Atom, 4> Atoms;
337 #endif
338 
339 #ifndef NDEBUG
340   void print(raw_ostream &OS) const override;
341 #endif
342 protected:
order()343   uint64_t order() const override { return Die.getOffset(); }
344 
345   const DIE &Die;
346 };
347 
348 /// Accelerator table data implementation for Apple type accelerator tables.
349 class AppleAccelTableTypeData : public AppleAccelTableOffsetData {
350 public:
AppleAccelTableTypeData(const DIE & D)351   AppleAccelTableTypeData(const DIE &D) : AppleAccelTableOffsetData(D) {}
352 
353   void emit(AsmPrinter *Asm) const override;
354 
355 #ifndef _MSC_VER
356   // The line below is rejected by older versions (TBD) of MSVC.
357   static constexpr Atom Atoms[] = {
358       Atom(dwarf::DW_ATOM_die_offset, dwarf::DW_FORM_data4),
359       Atom(dwarf::DW_ATOM_die_tag, dwarf::DW_FORM_data2),
360       Atom(dwarf::DW_ATOM_type_flags, dwarf::DW_FORM_data1)};
361 #else
362   // FIXME: Erase this path once the minimum MSCV version has been bumped.
363   static const SmallVector<Atom, 4> Atoms;
364 #endif
365 
366 #ifndef NDEBUG
367   void print(raw_ostream &OS) const override;
368 #endif
369 };
370 
371 /// Accelerator table data implementation for simple Apple accelerator tables
372 /// with a DIE offset but no actual DIE pointer.
373 class AppleAccelTableStaticOffsetData : public AppleAccelTableData {
374 public:
AppleAccelTableStaticOffsetData(uint32_t Offset)375   AppleAccelTableStaticOffsetData(uint32_t Offset) : Offset(Offset) {}
376 
377   void emit(AsmPrinter *Asm) const override;
378 
379 #ifndef _MSC_VER
380   // The line below is rejected by older versions (TBD) of MSVC.
381   static constexpr Atom Atoms[] = {
382       Atom(dwarf::DW_ATOM_die_offset, dwarf::DW_FORM_data4)};
383 #else
384   // FIXME: Erase this path once the minimum MSCV version has been bumped.
385   static const SmallVector<Atom, 4> Atoms;
386 #endif
387 
388 #ifndef NDEBUG
389   void print(raw_ostream &OS) const override;
390 #endif
391 protected:
order()392   uint64_t order() const override { return Offset; }
393 
394   uint32_t Offset;
395 };
396 
397 /// Accelerator table data implementation for type accelerator tables with
398 /// a DIE offset but no actual DIE pointer.
399 class AppleAccelTableStaticTypeData : public AppleAccelTableStaticOffsetData {
400 public:
AppleAccelTableStaticTypeData(uint32_t Offset,uint16_t Tag,bool ObjCClassIsImplementation,uint32_t QualifiedNameHash)401   AppleAccelTableStaticTypeData(uint32_t Offset, uint16_t Tag,
402                                 bool ObjCClassIsImplementation,
403                                 uint32_t QualifiedNameHash)
404       : AppleAccelTableStaticOffsetData(Offset),
405         QualifiedNameHash(QualifiedNameHash), Tag(Tag),
406         ObjCClassIsImplementation(ObjCClassIsImplementation) {}
407 
408   void emit(AsmPrinter *Asm) const override;
409 
410 #ifndef _MSC_VER
411   // The line below is rejected by older versions (TBD) of MSVC.
412   static constexpr Atom Atoms[] = {
413       Atom(dwarf::DW_ATOM_die_offset, dwarf::DW_FORM_data4),
414       Atom(dwarf::DW_ATOM_die_tag, dwarf::DW_FORM_data2),
415       Atom(5, dwarf::DW_FORM_data1), Atom(6, dwarf::DW_FORM_data4)};
416 #else
417   // FIXME: Erase this path once the minimum MSCV version has been bumped.
418   static const SmallVector<Atom, 4> Atoms;
419 #endif
420 
421 #ifndef NDEBUG
422   void print(raw_ostream &OS) const override;
423 #endif
424 protected:
order()425   uint64_t order() const override { return Offset; }
426 
427   uint32_t QualifiedNameHash;
428   uint16_t Tag;
429   bool ObjCClassIsImplementation;
430 };
431 
432 } // end namespace llvm
433 
434 #endif // LLVM_CODEGEN_DWARFACCELTABLE_H
435