Home | History | Annotate | Download | only in CodeGen
      1 //==- include/llvm/CodeGen/AccelTable.h - Accelerator Tables -----*- C++ -*-==//
      2 //
      3 //                     The LLVM Compiler Infrastructure
      4 //
      5 // This file is distributed under the University of Illinois Open Source
      6 // License. See LICENSE.TXT for details.
      7 //
      8 //===----------------------------------------------------------------------===//
      9 //
     10 // This file contains support for writing accelerator tables.
     11 //
     12 //===----------------------------------------------------------------------===//
     13 
     14 #ifndef LLVM_CODEGEN_DWARFACCELTABLE_H
     15 #define LLVM_CODEGEN_DWARFACCELTABLE_H
     16 
     17 #include "llvm/ADT/ArrayRef.h"
     18 #include "llvm/ADT/SmallVector.h"
     19 #include "llvm/ADT/StringMap.h"
     20 #include "llvm/ADT/StringRef.h"
     21 #include "llvm/BinaryFormat/Dwarf.h"
     22 #include "llvm/CodeGen/DIE.h"
     23 #include "llvm/CodeGen/DwarfStringPoolEntry.h"
     24 #include "llvm/MC/MCSymbol.h"
     25 #include "llvm/Support/Allocator.h"
     26 #include "llvm/Support/DJB.h"
     27 #include "llvm/Support/Debug.h"
     28 #include "llvm/Support/Format.h"
     29 #include "llvm/Support/raw_ostream.h"
     30 #include <cstddef>
     31 #include <cstdint>
     32 #include <vector>
     33 
     34 /// The DWARF and Apple accelerator tables are an indirect hash table optimized
     35 /// for null lookup rather than access to known data. The Apple accelerator
     36 /// tables are a precursor of the newer DWARF v5 accelerator tables. Both
     37 /// formats share common design ideas.
     38 ///
     39 /// The Apple accelerator table are output into an on-disk format that looks
     40 /// like this:
     41 ///
     42 /// .------------------.
     43 /// |  HEADER          |
     44 /// |------------------|
     45 /// |  BUCKETS         |
     46 /// |------------------|
     47 /// |  HASHES          |
     48 /// |------------------|
     49 /// |  OFFSETS         |
     50 /// |------------------|
     51 /// |  DATA            |
     52 /// `------------------'
     53 ///
     54 /// The header contains a magic number, version, type of hash function,
     55 /// the number of buckets, total number of hashes, and room for a special struct
     56 /// of data and the length of that struct.
     57 ///
     58 /// The buckets contain an index (e.g. 6) into the hashes array. The hashes
     59 /// section contains all of the 32-bit hash values in contiguous memory, and the
     60 /// offsets contain the offset into the data area for the particular hash.
     61 ///
     62 /// For a lookup example, we could hash a function name and take it modulo the
     63 /// number of buckets giving us our bucket. From there we take the bucket value
     64 /// as an index into the hashes table and look at each successive hash as long
     65 /// as the hash value is still the same modulo result (bucket value) as earlier.
     66 /// If we have a match we look at that same entry in the offsets table and grab
     67 /// the offset in the data for our final match.
     68 ///
     69 /// The DWARF v5 accelerator table consists of zero or more name indices that
     70 /// are output into an on-disk format that looks like this:
     71 ///
     72 /// .------------------.
     73 /// |  HEADER          |
     74 /// |------------------|
     75 /// |  CU LIST         |
     76 /// |------------------|
     77 /// |  LOCAL TU LIST   |
     78 /// |------------------|
     79 /// |  FOREIGN TU LIST |
     80 /// |------------------|
     81 /// |  HASH TABLE      |
     82 /// |------------------|
     83 /// |  NAME TABLE      |
     84 /// |------------------|
     85 /// |  ABBREV TABLE    |
     86 /// |------------------|
     87 /// |  ENTRY POOL      |
     88 /// `------------------'
     89 ///
     90 /// For the full documentation please refer to the DWARF 5 standard.
     91 ///
     92 ///
     93 /// This file defines the class template AccelTable, which is represents an
     94 /// abstract view of an Accelerator table, without any notion of an on-disk
     95 /// layout. This class is parameterized by an entry type, which should derive
     96 /// from AccelTableData. This is the type of individual entries in the table,
     97 /// and it should store the data necessary to emit them. AppleAccelTableData is
     98 /// the base class for Apple Accelerator Table entries, which have a uniform
     99 /// structure based on a sequence of Atoms. There are different sub-classes
    100 /// derived from AppleAccelTable, which differ in the set of Atoms and how they
    101 /// obtain their values.
    102 ///
    103 /// An Apple Accelerator Table can be serialized by calling emitAppleAccelTable
    104 /// function.
    105 ///
    106 /// TODO: Add DWARF v5 emission code.
    107 
    108 namespace llvm {
    109 
    110 class AsmPrinter;
    111 class DwarfCompileUnit;
    112 class DwarfDebug;
    113 
    114 /// Interface which the different types of accelerator table data have to
    115 /// conform. It serves as a base class for different values of the template
    116 /// argument of the AccelTable class template.
    117 class AccelTableData {
    118 public:
    119   virtual ~AccelTableData() = default;
    120 
    121   bool operator<(const AccelTableData &Other) const {
    122     return order() < Other.order();
    123   }
    124 
    125     // Subclasses should implement:
    126     // static uint32_t hash(StringRef Name);
    127 
    128 #ifndef NDEBUG
    129   virtual void print(raw_ostream &OS) const = 0;
    130 #endif
    131 protected:
    132   virtual uint64_t order() const = 0;
    133 };
    134 
    135 /// A base class holding non-template-dependant functionality of the AccelTable
    136 /// class. Clients should not use this class directly but rather instantiate
    137 /// AccelTable with a type derived from AccelTableData.
    138 class AccelTableBase {
    139 public:
    140   using HashFn = uint32_t(StringRef);
    141 
    142   /// Represents a group of entries with identical name (and hence, hash value).
    143   struct HashData {
    144     DwarfStringPoolEntryRef Name;
    145     uint32_t HashValue;
    146     std::vector<AccelTableData *> Values;
    147     MCSymbol *Sym;
    148 
    149     HashData(DwarfStringPoolEntryRef Name, HashFn *Hash)
    150         : Name(Name), HashValue(Hash(Name.getString())) {}
    151 
    152 #ifndef NDEBUG
    153     void print(raw_ostream &OS) const;
    154     void dump() const { print(dbgs()); }
    155 #endif
    156   };
    157   using HashList = std::vector<HashData *>;
    158   using BucketList = std::vector<HashList>;
    159 
    160 protected:
    161   /// Allocator for HashData and Values.
    162   BumpPtrAllocator Allocator;
    163 
    164   using StringEntries = StringMap<HashData, BumpPtrAllocator &>;
    165   StringEntries Entries;
    166 
    167   HashFn *Hash;
    168   uint32_t BucketCount;
    169   uint32_t UniqueHashCount;
    170 
    171   HashList Hashes;
    172   BucketList Buckets;
    173 
    174   void computeBucketCount();
    175 
    176   AccelTableBase(HashFn *Hash) : Entries(Allocator), Hash(Hash) {}
    177 
    178 public:
    179   void finalize(AsmPrinter *Asm, StringRef Prefix);
    180   ArrayRef<HashList> getBuckets() const { return Buckets; }
    181   uint32_t getBucketCount() const { return BucketCount; }
    182   uint32_t getUniqueHashCount() const { return UniqueHashCount; }
    183   uint32_t getUniqueNameCount() const { return Entries.size(); }
    184 
    185 #ifndef NDEBUG
    186   void print(raw_ostream &OS) const;
    187   void dump() const { print(dbgs()); }
    188 #endif
    189 
    190   AccelTableBase(const AccelTableBase &) = delete;
    191   void operator=(const AccelTableBase &) = delete;
    192 };
    193 
    194 /// This class holds an abstract representation of an Accelerator Table,
    195 /// consisting of a sequence of buckets, each bucket containint a sequence of
    196 /// HashData entries. The class is parameterized by the type of entries it
    197 /// holds. The type template parameter also defines the hash function to use for
    198 /// hashing names.
    199 template <typename DataT> class AccelTable : public AccelTableBase {
    200 public:
    201   AccelTable() : AccelTableBase(DataT::hash) {}
    202 
    203   template <typename... Types>
    204   void addName(DwarfStringPoolEntryRef Name, Types &&... Args);
    205 };
    206 
    207 template <typename AccelTableDataT>
    208 template <typename... Types>
    209 void AccelTable<AccelTableDataT>::addName(DwarfStringPoolEntryRef Name,
    210                                           Types &&... Args) {
    211   assert(Buckets.empty() && "Already finalized!");
    212   // If the string is in the list already then add this die to the list
    213   // otherwise add a new one.
    214   auto Iter = Entries.try_emplace(Name.getString(), Name, Hash).first;
    215   assert(Iter->second.Name == Name);
    216   Iter->second.Values.push_back(
    217       new (Allocator) AccelTableDataT(std::forward<Types>(Args)...));
    218 }
    219 
    220 /// A base class for different implementations of Data classes for Apple
    221 /// Accelerator Tables. The columns in the table are defined by the static Atoms
    222 /// variable defined on the subclasses.
    223 class AppleAccelTableData : public AccelTableData {
    224 public:
    225   /// An Atom defines the form of the data in an Apple accelerator table.
    226   /// Conceptually it is a column in the accelerator consisting of a type and a
    227   /// specification of the form of its data.
    228   struct Atom {
    229     /// Atom Type.
    230     const uint16_t Type;
    231     /// DWARF Form.
    232     const uint16_t Form;
    233 
    234     constexpr Atom(uint16_t Type, uint16_t Form) : Type(Type), Form(Form) {}
    235 
    236 #ifndef NDEBUG
    237     void print(raw_ostream &OS) const;
    238     void dump() const { print(dbgs()); }
    239 #endif
    240   };
    241   // Subclasses should define:
    242   // static constexpr Atom Atoms[];
    243 
    244   virtual void emit(AsmPrinter *Asm) const = 0;
    245 
    246   static uint32_t hash(StringRef Buffer) { return djbHash(Buffer); }
    247 };
    248 
    249 /// The Data class implementation for DWARF v5 accelerator table. Unlike the
    250 /// Apple Data classes, this class is just a DIE wrapper, and does not know to
    251 /// serialize itself. The complete serialization logic is in the
    252 /// emitDWARF5AccelTable function.
    253 class DWARF5AccelTableData : public AccelTableData {
    254 public:
    255   static uint32_t hash(StringRef Name) { return caseFoldingDjbHash(Name); }
    256 
    257   DWARF5AccelTableData(const DIE &Die) : Die(Die) {}
    258 
    259 #ifndef NDEBUG
    260   void print(raw_ostream &OS) const override;
    261 #endif
    262 
    263   const DIE &getDie() const { return Die; }
    264   uint64_t getDieOffset() const { return Die.getOffset(); }
    265   unsigned getDieTag() const { return Die.getTag(); }
    266 
    267 protected:
    268   const DIE &Die;
    269 
    270   uint64_t order() const override { return Die.getOffset(); }
    271 };
    272 
    273 class DWARF5AccelTableStaticData : public AccelTableData {
    274 public:
    275   static uint32_t hash(StringRef Name) { return caseFoldingDjbHash(Name); }
    276 
    277   DWARF5AccelTableStaticData(uint64_t DieOffset, unsigned DieTag,
    278                              unsigned CUIndex)
    279       : DieOffset(DieOffset), DieTag(DieTag), CUIndex(CUIndex) {}
    280 
    281 #ifndef NDEBUG
    282   void print(raw_ostream &OS) const override;
    283 #endif
    284 
    285   uint64_t getDieOffset() const { return DieOffset; }
    286   unsigned getDieTag() const { return DieTag; }
    287   unsigned getCUIndex() const { return CUIndex; }
    288 
    289 protected:
    290   uint64_t DieOffset;
    291   unsigned DieTag;
    292   unsigned CUIndex;
    293 
    294   uint64_t order() const override { return DieOffset; }
    295 };
    296 
    297 void emitAppleAccelTableImpl(AsmPrinter *Asm, AccelTableBase &Contents,
    298                              StringRef Prefix, const MCSymbol *SecBegin,
    299                              ArrayRef<AppleAccelTableData::Atom> Atoms);
    300 
    301 /// Emit an Apple Accelerator Table consisting of entries in the specified
    302 /// AccelTable. The DataT template parameter should be derived from
    303 /// AppleAccelTableData.
    304 template <typename DataT>
    305 void emitAppleAccelTable(AsmPrinter *Asm, AccelTable<DataT> &Contents,
    306                          StringRef Prefix, const MCSymbol *SecBegin) {
    307   static_assert(std::is_convertible<DataT *, AppleAccelTableData *>::value, "");
    308   emitAppleAccelTableImpl(Asm, Contents, Prefix, SecBegin, DataT::Atoms);
    309 }
    310 
    311 void emitDWARF5AccelTable(AsmPrinter *Asm,
    312                           AccelTable<DWARF5AccelTableData> &Contents,
    313                           const DwarfDebug &DD,
    314                           ArrayRef<std::unique_ptr<DwarfCompileUnit>> CUs);
    315 
    316 void emitDWARF5AccelTable(
    317     AsmPrinter *Asm, AccelTable<DWARF5AccelTableStaticData> &Contents,
    318     ArrayRef<MCSymbol *> CUs,
    319     llvm::function_ref<unsigned(const DWARF5AccelTableStaticData &)>
    320         getCUIndexForEntry);
    321 
    322 /// Accelerator table data implementation for simple Apple accelerator tables
    323 /// with just a DIE reference.
    324 class AppleAccelTableOffsetData : public AppleAccelTableData {
    325 public:
    326   AppleAccelTableOffsetData(const DIE &D) : Die(D) {}
    327 
    328   void emit(AsmPrinter *Asm) const override;
    329 
    330 #ifndef _MSC_VER
    331   // The line below is rejected by older versions (TBD) of MSVC.
    332   static constexpr Atom Atoms[] = {
    333       Atom(dwarf::DW_ATOM_die_offset, dwarf::DW_FORM_data4)};
    334 #else
    335   // FIXME: Erase this path once the minimum MSCV version has been bumped.
    336   static const SmallVector<Atom, 4> Atoms;
    337 #endif
    338 
    339 #ifndef NDEBUG
    340   void print(raw_ostream &OS) const override;
    341 #endif
    342 protected:
    343   uint64_t order() const override { return Die.getOffset(); }
    344 
    345   const DIE &Die;
    346 };
    347 
    348 /// Accelerator table data implementation for Apple type accelerator tables.
    349 class AppleAccelTableTypeData : public AppleAccelTableOffsetData {
    350 public:
    351   AppleAccelTableTypeData(const DIE &D) : AppleAccelTableOffsetData(D) {}
    352 
    353   void emit(AsmPrinter *Asm) const override;
    354 
    355 #ifndef _MSC_VER
    356   // The line below is rejected by older versions (TBD) of MSVC.
    357   static constexpr Atom Atoms[] = {
    358       Atom(dwarf::DW_ATOM_die_offset, dwarf::DW_FORM_data4),
    359       Atom(dwarf::DW_ATOM_die_tag, dwarf::DW_FORM_data2),
    360       Atom(dwarf::DW_ATOM_type_flags, dwarf::DW_FORM_data1)};
    361 #else
    362   // FIXME: Erase this path once the minimum MSCV version has been bumped.
    363   static const SmallVector<Atom, 4> Atoms;
    364 #endif
    365 
    366 #ifndef NDEBUG
    367   void print(raw_ostream &OS) const override;
    368 #endif
    369 };
    370 
    371 /// Accelerator table data implementation for simple Apple accelerator tables
    372 /// with a DIE offset but no actual DIE pointer.
    373 class AppleAccelTableStaticOffsetData : public AppleAccelTableData {
    374 public:
    375   AppleAccelTableStaticOffsetData(uint32_t Offset) : Offset(Offset) {}
    376 
    377   void emit(AsmPrinter *Asm) const override;
    378 
    379 #ifndef _MSC_VER
    380   // The line below is rejected by older versions (TBD) of MSVC.
    381   static constexpr Atom Atoms[] = {
    382       Atom(dwarf::DW_ATOM_die_offset, dwarf::DW_FORM_data4)};
    383 #else
    384   // FIXME: Erase this path once the minimum MSCV version has been bumped.
    385   static const SmallVector<Atom, 4> Atoms;
    386 #endif
    387 
    388 #ifndef NDEBUG
    389   void print(raw_ostream &OS) const override;
    390 #endif
    391 protected:
    392   uint64_t order() const override { return Offset; }
    393 
    394   uint32_t Offset;
    395 };
    396 
    397 /// Accelerator table data implementation for type accelerator tables with
    398 /// a DIE offset but no actual DIE pointer.
    399 class AppleAccelTableStaticTypeData : public AppleAccelTableStaticOffsetData {
    400 public:
    401   AppleAccelTableStaticTypeData(uint32_t Offset, uint16_t Tag,
    402                                 bool ObjCClassIsImplementation,
    403                                 uint32_t QualifiedNameHash)
    404       : AppleAccelTableStaticOffsetData(Offset),
    405         QualifiedNameHash(QualifiedNameHash), Tag(Tag),
    406         ObjCClassIsImplementation(ObjCClassIsImplementation) {}
    407 
    408   void emit(AsmPrinter *Asm) const override;
    409 
    410 #ifndef _MSC_VER
    411   // The line below is rejected by older versions (TBD) of MSVC.
    412   static constexpr Atom Atoms[] = {
    413       Atom(dwarf::DW_ATOM_die_offset, dwarf::DW_FORM_data4),
    414       Atom(dwarf::DW_ATOM_die_tag, dwarf::DW_FORM_data2),
    415       Atom(5, dwarf::DW_FORM_data1), Atom(6, dwarf::DW_FORM_data4)};
    416 #else
    417   // FIXME: Erase this path once the minimum MSCV version has been bumped.
    418   static const SmallVector<Atom, 4> Atoms;
    419 #endif
    420 
    421 #ifndef NDEBUG
    422   void print(raw_ostream &OS) const override;
    423 #endif
    424 protected:
    425   uint64_t order() const override { return Offset; }
    426 
    427   uint32_t QualifiedNameHash;
    428   uint16_t Tag;
    429   bool ObjCClassIsImplementation;
    430 };
    431 
    432 } // end namespace llvm
    433 
    434 #endif // LLVM_CODEGEN_DWARFACCELTABLE_H
    435