1 //==- include/llvm/CodeGen/AccelTable.h - Accelerator Tables -----*- C++ -*-==//
2 //
3 // Part of the LLVM Project, under the Apache License v2.0 with LLVM Exceptions.
4 // See https://llvm.org/LICENSE.txt for license information.
5 // SPDX-License-Identifier: Apache-2.0 WITH LLVM-exception
6 //
7 //===----------------------------------------------------------------------===//
8 /// \file
9 /// This file contains support for writing accelerator tables.
10 ///
11 //===----------------------------------------------------------------------===//
12 
13 #ifndef LLVM_CODEGEN_ACCELTABLE_H
14 #define LLVM_CODEGEN_ACCELTABLE_H
15 
16 #include "llvm/ADT/ArrayRef.h"
17 #include "llvm/ADT/MapVector.h"
18 #include "llvm/ADT/STLFunctionalExtras.h"
19 #include "llvm/ADT/StringMap.h"
20 #include "llvm/ADT/StringRef.h"
21 #include "llvm/BinaryFormat/Dwarf.h"
22 #include "llvm/CodeGen/DIE.h"
23 #include "llvm/CodeGen/DwarfStringPoolEntry.h"
24 #include "llvm/Support/Allocator.h"
25 #include "llvm/Support/DJB.h"
26 #include "llvm/Support/Debug.h"
27 #include <cstdint>
28 #include <vector>
29 
30 /// \file
31 /// The DWARF and Apple accelerator tables are an indirect hash table optimized
32 /// for null lookup rather than access to known data. The Apple accelerator
33 /// tables are a precursor of the newer DWARF v5 accelerator tables. Both
34 /// formats share common design ideas.
35 ///
36 /// The Apple accelerator table are output into an on-disk format that looks
37 /// like this:
38 ///
39 /// .------------------.
40 /// |  HEADER          |
41 /// |------------------|
42 /// |  BUCKETS         |
43 /// |------------------|
44 /// |  HASHES          |
45 /// |------------------|
46 /// |  OFFSETS         |
47 /// |------------------|
48 /// |  DATA            |
49 /// `------------------'
50 ///
51 /// The header contains a magic number, version, type of hash function,
52 /// the number of buckets, total number of hashes, and room for a special struct
53 /// of data and the length of that struct.
54 ///
55 /// The buckets contain an index (e.g. 6) into the hashes array. The hashes
56 /// section contains all of the 32-bit hash values in contiguous memory, and the
57 /// offsets contain the offset into the data area for the particular hash.
58 ///
59 /// For a lookup example, we could hash a function name and take it modulo the
60 /// number of buckets giving us our bucket. From there we take the bucket value
61 /// as an index into the hashes table and look at each successive hash as long
62 /// as the hash value is still the same modulo result (bucket value) as earlier.
63 /// If we have a match we look at that same entry in the offsets table and grab
64 /// the offset in the data for our final match.
65 ///
66 /// The DWARF v5 accelerator table consists of zero or more name indices that
67 /// are output into an on-disk format that looks like this:
68 ///
69 /// .------------------.
70 /// |  HEADER          |
71 /// |------------------|
72 /// |  CU LIST         |
73 /// |------------------|
74 /// |  LOCAL TU LIST   |
75 /// |------------------|
76 /// |  FOREIGN TU LIST |
77 /// |------------------|
78 /// |  HASH TABLE      |
79 /// |------------------|
80 /// |  NAME TABLE      |
81 /// |------------------|
82 /// |  ABBREV TABLE    |
83 /// |------------------|
84 /// |  ENTRY POOL      |
85 /// `------------------'
86 ///
87 /// For the full documentation please refer to the DWARF 5 standard.
88 ///
89 ///
90 /// This file defines the class template AccelTable, which is represents an
91 /// abstract view of an Accelerator table, without any notion of an on-disk
92 /// layout. This class is parameterized by an entry type, which should derive
93 /// from AccelTableData. This is the type of individual entries in the table,
94 /// and it should store the data necessary to emit them. AppleAccelTableData is
95 /// the base class for Apple Accelerator Table entries, which have a uniform
96 /// structure based on a sequence of Atoms. There are different sub-classes
97 /// derived from AppleAccelTable, which differ in the set of Atoms and how they
98 /// obtain their values.
99 ///
100 /// An Apple Accelerator Table can be serialized by calling emitAppleAccelTable
101 /// function.
102 
103 namespace llvm {
104 
105 class AsmPrinter;
106 class DwarfCompileUnit;
107 class DwarfDebug;
108 class MCSymbol;
109 class raw_ostream;
110 
111 /// Interface which the different types of accelerator table data have to
112 /// conform. It serves as a base class for different values of the template
113 /// argument of the AccelTable class template.
114 class AccelTableData {
115 public:
116   virtual ~AccelTableData() = default;
117 
118   bool operator<(const AccelTableData &Other) const {
119     return order() < Other.order();
120   }
121 
122     // Subclasses should implement:
123     // static uint32_t hash(StringRef Name);
124 
125 #ifndef NDEBUG
126   virtual void print(raw_ostream &OS) const = 0;
127 #endif
128 protected:
129   virtual uint64_t order() const = 0;
130 };
131 
132 /// A base class holding non-template-dependant functionality of the AccelTable
133 /// class. Clients should not use this class directly but rather instantiate
134 /// AccelTable with a type derived from AccelTableData.
135 class AccelTableBase {
136 public:
137   using HashFn = uint32_t(StringRef);
138 
139   /// Represents a group of entries with identical name (and hence, hash value).
140   struct HashData {
141     DwarfStringPoolEntryRef Name;
142     uint32_t HashValue;
143     std::vector<AccelTableData *> Values;
144     MCSymbol *Sym;
145 
146 #ifndef NDEBUG
147     void print(raw_ostream &OS) const;
148     void dump() const { print(dbgs()); }
149 #endif
150   };
151   using HashList = std::vector<HashData *>;
152   using BucketList = std::vector<HashList>;
153 
154 protected:
155   /// Allocator for HashData and Values.
156   BumpPtrAllocator Allocator;
157 
158   using StringEntries = MapVector<StringRef, HashData>;
159   StringEntries Entries;
160 
161   HashFn *Hash;
162   uint32_t BucketCount = 0;
163   uint32_t UniqueHashCount = 0;
164 
165   HashList Hashes;
166   BucketList Buckets;
167 
168   void computeBucketCount();
169 
170   AccelTableBase(HashFn *Hash) : Hash(Hash) {}
171 
172 public:
173   void finalize(AsmPrinter *Asm, StringRef Prefix);
174   ArrayRef<HashList> getBuckets() const { return Buckets; }
175   uint32_t getBucketCount() const { return BucketCount; }
176   uint32_t getUniqueHashCount() const { return UniqueHashCount; }
177   uint32_t getUniqueNameCount() const { return Entries.size(); }
178 
179 #ifndef NDEBUG
180   void print(raw_ostream &OS) const;
181   void dump() const { print(dbgs()); }
182 #endif
183 
184   AccelTableBase(const AccelTableBase &) = delete;
185   void operator=(const AccelTableBase &) = delete;
186 };
187 
188 /// This class holds an abstract representation of an Accelerator Table,
189 /// consisting of a sequence of buckets, each bucket containint a sequence of
190 /// HashData entries. The class is parameterized by the type of entries it
191 /// holds. The type template parameter also defines the hash function to use for
192 /// hashing names.
193 template <typename DataT> class AccelTable : public AccelTableBase {
194 public:
195   AccelTable() : AccelTableBase(DataT::hash) {}
196 
197   template <typename... Types>
198   void addName(DwarfStringPoolEntryRef Name, Types &&... Args);
199 };
200 
201 template <typename AccelTableDataT>
202 template <typename... Types>
203 void AccelTable<AccelTableDataT>::addName(DwarfStringPoolEntryRef Name,
204                                           Types &&... Args) {
205   assert(Buckets.empty() && "Already finalized!");
206   // If the string is in the list already then add this die to the list
207   // otherwise add a new one.
208   auto &It = Entries[Name.getString()];
209   if (It.Values.empty()) {
210     It.Name = Name;
211     It.HashValue = Hash(Name.getString());
212   }
213   It.Values.push_back(new (Allocator)
214                           AccelTableDataT(std::forward<Types>(Args)...));
215 }
216 
217 /// A base class for different implementations of Data classes for Apple
218 /// Accelerator Tables. The columns in the table are defined by the static Atoms
219 /// variable defined on the subclasses.
220 class AppleAccelTableData : public AccelTableData {
221 public:
222   /// An Atom defines the form of the data in an Apple accelerator table.
223   /// Conceptually it is a column in the accelerator consisting of a type and a
224   /// specification of the form of its data.
225   struct Atom {
226     /// Atom Type.
227     const uint16_t Type;
228     /// DWARF Form.
229     const uint16_t Form;
230 
231     constexpr Atom(uint16_t Type, uint16_t Form) : Type(Type), Form(Form) {}
232 
233 #ifndef NDEBUG
234     void print(raw_ostream &OS) const;
235     void dump() const { print(dbgs()); }
236 #endif
237   };
238   // Subclasses should define:
239   // static constexpr Atom Atoms[];
240 
241   virtual void emit(AsmPrinter *Asm) const = 0;
242 
243   static uint32_t hash(StringRef Buffer) { return djbHash(Buffer); }
244 };
245 
246 /// The Data class implementation for DWARF v5 accelerator table. Unlike the
247 /// Apple Data classes, this class is just a DIE wrapper, and does not know to
248 /// serialize itself. The complete serialization logic is in the
249 /// emitDWARF5AccelTable function.
250 class DWARF5AccelTableData : public AccelTableData {
251 public:
252   static uint32_t hash(StringRef Name) { return caseFoldingDjbHash(Name); }
253 
254   DWARF5AccelTableData(const DIE &Die) : Die(Die) {}
255 
256 #ifndef NDEBUG
257   void print(raw_ostream &OS) const override;
258 #endif
259 
260   const DIE &getDie() const { return Die; }
261   uint64_t getDieOffset() const { return Die.getOffset(); }
262   unsigned getDieTag() const { return Die.getTag(); }
263 
264 protected:
265   const DIE &Die;
266 
267   uint64_t order() const override { return Die.getOffset(); }
268 };
269 
270 class DWARF5AccelTableStaticData : public AccelTableData {
271 public:
272   static uint32_t hash(StringRef Name) { return caseFoldingDjbHash(Name); }
273 
274   DWARF5AccelTableStaticData(uint64_t DieOffset, unsigned DieTag,
275                              unsigned CUIndex)
276       : DieOffset(DieOffset), DieTag(DieTag), CUIndex(CUIndex) {}
277 
278 #ifndef NDEBUG
279   void print(raw_ostream &OS) const override;
280 #endif
281 
282   uint64_t getDieOffset() const { return DieOffset; }
283   unsigned getDieTag() const { return DieTag; }
284   unsigned getCUIndex() const { return CUIndex; }
285 
286 protected:
287   uint64_t DieOffset;
288   unsigned DieTag;
289   unsigned CUIndex;
290 
291   uint64_t order() const override { return DieOffset; }
292 };
293 
294 void emitAppleAccelTableImpl(AsmPrinter *Asm, AccelTableBase &Contents,
295                              StringRef Prefix, const MCSymbol *SecBegin,
296                              ArrayRef<AppleAccelTableData::Atom> Atoms);
297 
298 /// Emit an Apple Accelerator Table consisting of entries in the specified
299 /// AccelTable. The DataT template parameter should be derived from
300 /// AppleAccelTableData.
301 template <typename DataT>
302 void emitAppleAccelTable(AsmPrinter *Asm, AccelTable<DataT> &Contents,
303                          StringRef Prefix, const MCSymbol *SecBegin) {
304   static_assert(std::is_convertible<DataT *, AppleAccelTableData *>::value);
305   emitAppleAccelTableImpl(Asm, Contents, Prefix, SecBegin, DataT::Atoms);
306 }
307 
308 void emitDWARF5AccelTable(AsmPrinter *Asm,
309                           AccelTable<DWARF5AccelTableData> &Contents,
310                           const DwarfDebug &DD,
311                           ArrayRef<std::unique_ptr<DwarfCompileUnit>> CUs);
312 
313 void emitDWARF5AccelTable(
314     AsmPrinter *Asm, AccelTable<DWARF5AccelTableStaticData> &Contents,
315     ArrayRef<MCSymbol *> CUs,
316     llvm::function_ref<unsigned(const DWARF5AccelTableStaticData &)>
317         getCUIndexForEntry);
318 
319 /// Accelerator table data implementation for simple Apple accelerator tables
320 /// with just a DIE reference.
321 class AppleAccelTableOffsetData : public AppleAccelTableData {
322 public:
323   AppleAccelTableOffsetData(const DIE &D) : Die(D) {}
324 
325   void emit(AsmPrinter *Asm) const override;
326 
327   static constexpr Atom Atoms[] = {
328       Atom(dwarf::DW_ATOM_die_offset, dwarf::DW_FORM_data4)};
329 
330 #ifndef NDEBUG
331   void print(raw_ostream &OS) const override;
332 #endif
333 protected:
334   uint64_t order() const override { return Die.getOffset(); }
335 
336   const DIE &Die;
337 };
338 
339 /// Accelerator table data implementation for Apple type accelerator tables.
340 class AppleAccelTableTypeData : public AppleAccelTableOffsetData {
341 public:
342   AppleAccelTableTypeData(const DIE &D) : AppleAccelTableOffsetData(D) {}
343 
344   void emit(AsmPrinter *Asm) const override;
345 
346   static constexpr Atom Atoms[] = {
347       Atom(dwarf::DW_ATOM_die_offset, dwarf::DW_FORM_data4),
348       Atom(dwarf::DW_ATOM_die_tag, dwarf::DW_FORM_data2),
349       Atom(dwarf::DW_ATOM_type_flags, dwarf::DW_FORM_data1)};
350 
351 #ifndef NDEBUG
352   void print(raw_ostream &OS) const override;
353 #endif
354 };
355 
356 /// Accelerator table data implementation for simple Apple accelerator tables
357 /// with a DIE offset but no actual DIE pointer.
358 class AppleAccelTableStaticOffsetData : public AppleAccelTableData {
359 public:
360   AppleAccelTableStaticOffsetData(uint32_t Offset) : Offset(Offset) {}
361 
362   void emit(AsmPrinter *Asm) const override;
363 
364   static constexpr Atom Atoms[] = {
365       Atom(dwarf::DW_ATOM_die_offset, dwarf::DW_FORM_data4)};
366 
367 #ifndef NDEBUG
368   void print(raw_ostream &OS) const override;
369 #endif
370 protected:
371   uint64_t order() const override { return Offset; }
372 
373   uint32_t Offset;
374 };
375 
376 /// Accelerator table data implementation for type accelerator tables with
377 /// a DIE offset but no actual DIE pointer.
378 class AppleAccelTableStaticTypeData : public AppleAccelTableStaticOffsetData {
379 public:
380   AppleAccelTableStaticTypeData(uint32_t Offset, uint16_t Tag,
381                                 bool ObjCClassIsImplementation,
382                                 uint32_t QualifiedNameHash)
383       : AppleAccelTableStaticOffsetData(Offset),
384         QualifiedNameHash(QualifiedNameHash), Tag(Tag),
385         ObjCClassIsImplementation(ObjCClassIsImplementation) {}
386 
387   void emit(AsmPrinter *Asm) const override;
388 
389   static constexpr Atom Atoms[] = {
390       Atom(dwarf::DW_ATOM_die_offset, dwarf::DW_FORM_data4),
391       Atom(dwarf::DW_ATOM_die_tag, dwarf::DW_FORM_data2),
392       Atom(5, dwarf::DW_FORM_data1), Atom(6, dwarf::DW_FORM_data4)};
393 
394 #ifndef NDEBUG
395   void print(raw_ostream &OS) const override;
396 #endif
397 protected:
398   uint64_t order() const override { return Offset; }
399 
400   uint32_t QualifiedNameHash;
401   uint16_t Tag;
402   bool ObjCClassIsImplementation;
403 };
404 
405 } // end namespace llvm
406 
407 #endif // LLVM_CODEGEN_ACCELTABLE_H
408