xref: /llvm-project/llvm/lib/DebugInfo/PDB/Native/PDBStringTableBuilder.cpp (revision eb629994554a05a4d3e59d6b5c09d312416d096e)
1 //===- PDBStringTableBuilder.cpp - PDB String Table -------------*- C++ -*-===//
2 //
3 //                     The LLVM Compiler Infrastructure
4 //
5 // This file is distributed under the University of Illinois Open Source
6 // License. See LICENSE.TXT for details.
7 //
8 //===----------------------------------------------------------------------===//
9 
10 #include "llvm/DebugInfo/PDB/Native/PDBStringTableBuilder.h"
11 
12 #include "llvm/ADT/ArrayRef.h"
13 #include "llvm/DebugInfo/PDB/Native/Hash.h"
14 #include "llvm/DebugInfo/PDB/Native/RawTypes.h"
15 #include "llvm/Support/BinaryStreamWriter.h"
16 #include "llvm/Support/Endian.h"
17 
18 using namespace llvm;
19 using namespace llvm::msf;
20 using namespace llvm::support;
21 using namespace llvm::support::endian;
22 using namespace llvm::pdb;
23 
24 uint32_t PDBStringTableBuilder::insert(StringRef S) {
25   return Strings.insert(S);
26 }
27 
/// Returns the number of hash buckets to allocate for a table holding
/// \p NumStrings strings.
///
/// The result is floor((NumStrings + 1) * 1.25), saturated at UINT32_MAX.
static uint32_t computeBucketCount(uint32_t NumStrings) {
  // The /names stream is basically an on-disk open-addressing hash table.
  // Hash collisions are resolved by linear probing. We cannot make
  // utilization 100% because it will make the linear probing extremely
  // slow. But lower utilization wastes disk space. As a reasonable
  // load factor, we choose 80%. We need +1 because slot 0 is reserved.
  //
  // The computation is done in 64-bit integer arithmetic rather than in
  // floating point: for an integer N, floor(N * 1.25) == N + N / 4, and
  // widening first means NumStrings + 1 cannot wrap around to zero.
  const uint64_t Slots = static_cast<uint64_t>(NumStrings) + 1;
  const uint64_t Buckets = Slots + Slots / 4;

  // Saturate instead of performing an out-of-range narrowing conversion.
  if (Buckets > UINT32_MAX)
    return UINT32_MAX;
  return static_cast<uint32_t>(Buckets);
}
36 
37 uint32_t PDBStringTableBuilder::calculateHashTableSize() const {
38   uint32_t Size = sizeof(uint32_t); // Hash table begins with 4-byte size field.
39   Size += sizeof(uint32_t) * computeBucketCount(Strings.size());
40 
41   return Size;
42 }
43 
44 uint32_t PDBStringTableBuilder::calculateSerializedSize() const {
45   uint32_t Size = 0;
46   Size += sizeof(PDBStringTableHeader);
47   Size += Strings.calculateSerializedSize();
48   Size += calculateHashTableSize();
49   Size += sizeof(uint32_t); // The /names stream ends with the string count.
50   return Size;
51 }
52 
53 void PDBStringTableBuilder::setStrings(
54     const codeview::DebugStringTableSubsection &Strings) {
55   this->Strings = Strings;
56 }
57 
58 Error PDBStringTableBuilder::writeHeader(BinaryStreamWriter &Writer) const {
59   // Write a header
60   PDBStringTableHeader H;
61   H.Signature = PDBStringTableSignature;
62   H.HashVersion = 1;
63   H.ByteSize = Strings.calculateSerializedSize();
64   if (auto EC = Writer.writeObject(H))
65     return EC;
66   assert(Writer.bytesRemaining() == 0);
67   return Error::success();
68 }
69 
70 Error PDBStringTableBuilder::writeStrings(BinaryStreamWriter &Writer) const {
71   if (auto EC = Strings.commit(Writer))
72     return EC;
73 
74   assert(Writer.bytesRemaining() == 0);
75   return Error::success();
76 }
77 
78 Error PDBStringTableBuilder::writeHashTable(BinaryStreamWriter &Writer) const {
79   // Write a hash table.
80   uint32_t BucketCount = computeBucketCount(Strings.size());
81   if (auto EC = Writer.writeInteger(BucketCount))
82     return EC;
83   std::vector<ulittle32_t> Buckets(BucketCount);
84 
85   for (auto &Pair : Strings) {
86     StringRef S = Pair.getKey();
87     uint32_t Offset = Pair.getValue();
88     uint32_t Hash = hashStringV1(S);
89 
90     for (uint32_t I = 0; I != BucketCount; ++I) {
91       uint32_t Slot = (Hash + I) % BucketCount;
92       if (Buckets[Slot] != 0)
93         continue;
94       Buckets[Slot] = Offset;
95       break;
96     }
97   }
98 
99   if (auto EC = Writer.writeArray(ArrayRef<ulittle32_t>(Buckets)))
100     return EC;
101 
102   assert(Writer.bytesRemaining() == 0);
103   return Error::success();
104 }
105 
106 Error PDBStringTableBuilder::writeEpilogue(BinaryStreamWriter &Writer) const {
107   if (auto EC = Writer.writeInteger<uint32_t>(Strings.size()))
108     return EC;
109   assert(Writer.bytesRemaining() == 0);
110   return Error::success();
111 }
112 
113 Error PDBStringTableBuilder::commit(BinaryStreamWriter &Writer) const {
114   BinaryStreamWriter SectionWriter;
115 
116   std::tie(SectionWriter, Writer) = Writer.split(sizeof(PDBStringTableHeader));
117   if (auto EC = writeHeader(SectionWriter))
118     return EC;
119 
120   std::tie(SectionWriter, Writer) =
121       Writer.split(Strings.calculateSerializedSize());
122   if (auto EC = writeStrings(SectionWriter))
123     return EC;
124 
125   std::tie(SectionWriter, Writer) = Writer.split(calculateHashTableSize());
126   if (auto EC = writeHashTable(SectionWriter))
127     return EC;
128 
129   std::tie(SectionWriter, Writer) = Writer.split(sizeof(uint32_t));
130   if (auto EC = writeEpilogue(SectionWriter))
131     return EC;
132 
133   return Error::success();
134 }
135