xref: /llvm-project/llvm/lib/DebugInfo/PDB/Native/PDBStringTable.cpp (revision ed98c1b37661b0795a5e34517941485f0f0688d1)
1c504ae3cSZachary Turner //===- PDBStringTable.cpp - PDB String Table ---------------------*- C++-*-===//
2e204a6c9SZachary Turner //
3*2946cd70SChandler Carruth // Part of the LLVM Project, under the Apache License v2.0 with LLVM Exceptions.
4*2946cd70SChandler Carruth // See https://llvm.org/LICENSE.txt for license information.
5*2946cd70SChandler Carruth // SPDX-License-Identifier: Apache-2.0 WITH LLVM-exception
6e204a6c9SZachary Turner //
7e204a6c9SZachary Turner //===----------------------------------------------------------------------===//
8e204a6c9SZachary Turner 
9e204a6c9SZachary Turner #include "llvm/DebugInfo/PDB/Native/PDBStringTable.h"
10e204a6c9SZachary Turner 
11e204a6c9SZachary Turner #include "llvm/DebugInfo/PDB/Native/Hash.h"
12e204a6c9SZachary Turner #include "llvm/DebugInfo/PDB/Native/RawError.h"
13e204a6c9SZachary Turner #include "llvm/DebugInfo/PDB/Native/RawTypes.h"
14e204a6c9SZachary Turner #include "llvm/Support/BinaryStreamReader.h"
15e204a6c9SZachary Turner #include "llvm/Support/Endian.h"
16e204a6c9SZachary Turner 
17e204a6c9SZachary Turner using namespace llvm;
18e204a6c9SZachary Turner using namespace llvm::support;
19e204a6c9SZachary Turner using namespace llvm::pdb;
20e204a6c9SZachary Turner 
getByteSize() const21f3b4b2d8SZachary Turner uint32_t PDBStringTable::getByteSize() const { return Header->ByteSize; }
getNameCount() const22c504ae3cSZachary Turner uint32_t PDBStringTable::getNameCount() const { return NameCount; }
getHashVersion() const23c504ae3cSZachary Turner uint32_t PDBStringTable::getHashVersion() const { return Header->HashVersion; }
getSignature() const24c504ae3cSZachary Turner uint32_t PDBStringTable::getSignature() const { return Header->Signature; }
25e204a6c9SZachary Turner 
readHeader(BinaryStreamReader & Reader)26c504ae3cSZachary Turner Error PDBStringTable::readHeader(BinaryStreamReader &Reader) {
27c504ae3cSZachary Turner   if (auto EC = Reader.readObject(Header))
28e204a6c9SZachary Turner     return EC;
29e204a6c9SZachary Turner 
30c504ae3cSZachary Turner   if (Header->Signature != PDBStringTableSignature)
31e204a6c9SZachary Turner     return make_error<RawError>(raw_error_code::corrupt_file,
32e204a6c9SZachary Turner                                 "Invalid hash table signature");
33c504ae3cSZachary Turner   if (Header->HashVersion != 1 && Header->HashVersion != 2)
34e204a6c9SZachary Turner     return make_error<RawError>(raw_error_code::corrupt_file,
35e204a6c9SZachary Turner                                 "Unsupported hash version");
36e204a6c9SZachary Turner 
37c504ae3cSZachary Turner   assert(Reader.bytesRemaining() == 0);
38c504ae3cSZachary Turner   return Error::success();
39c504ae3cSZachary Turner }
40c504ae3cSZachary Turner 
readStrings(BinaryStreamReader & Reader)41c504ae3cSZachary Turner Error PDBStringTable::readStrings(BinaryStreamReader &Reader) {
422d5c2cd3SZachary Turner   BinaryStreamRef Stream;
432d5c2cd3SZachary Turner   if (auto EC = Reader.readStreamRef(Stream))
442d5c2cd3SZachary Turner     return EC;
452d5c2cd3SZachary Turner 
462d5c2cd3SZachary Turner   if (auto EC = Strings.initialize(Stream)) {
47e204a6c9SZachary Turner     return joinErrors(std::move(EC),
48e204a6c9SZachary Turner                       make_error<RawError>(raw_error_code::corrupt_file,
49e204a6c9SZachary Turner                                            "Invalid hash table byte length"));
50c504ae3cSZachary Turner   }
51e204a6c9SZachary Turner 
52c504ae3cSZachary Turner   assert(Reader.bytesRemaining() == 0);
53c504ae3cSZachary Turner   return Error::success();
54c504ae3cSZachary Turner }
55c504ae3cSZachary Turner 
56a8cfc29cSZachary Turner const codeview::DebugStringTableSubsectionRef &
getStringTable() const57a8cfc29cSZachary Turner PDBStringTable::getStringTable() const {
5892dcdda6SZachary Turner   return Strings;
5992dcdda6SZachary Turner }
6092dcdda6SZachary Turner 
readHashTable(BinaryStreamReader & Reader)61c504ae3cSZachary Turner Error PDBStringTable::readHashTable(BinaryStreamReader &Reader) {
62e204a6c9SZachary Turner   const support::ulittle32_t *HashCount;
63c504ae3cSZachary Turner   if (auto EC = Reader.readObject(HashCount))
64e204a6c9SZachary Turner     return EC;
65e204a6c9SZachary Turner 
66c504ae3cSZachary Turner   if (auto EC = Reader.readArray(IDs, *HashCount)) {
67e204a6c9SZachary Turner     return joinErrors(std::move(EC),
68e204a6c9SZachary Turner                       make_error<RawError>(raw_error_code::corrupt_file,
69e204a6c9SZachary Turner                                            "Could not read bucket array"));
70c504ae3cSZachary Turner   }
71e204a6c9SZachary Turner 
72e204a6c9SZachary Turner   return Error::success();
73e204a6c9SZachary Turner }
74e204a6c9SZachary Turner 
readEpilogue(BinaryStreamReader & Reader)75c504ae3cSZachary Turner Error PDBStringTable::readEpilogue(BinaryStreamReader &Reader) {
76c504ae3cSZachary Turner   if (auto EC = Reader.readInteger(NameCount))
77c504ae3cSZachary Turner     return EC;
78c504ae3cSZachary Turner 
79c504ae3cSZachary Turner   assert(Reader.bytesRemaining() == 0);
80c504ae3cSZachary Turner   return Error::success();
81c504ae3cSZachary Turner }
82c504ae3cSZachary Turner 
reload(BinaryStreamReader & Reader)83c504ae3cSZachary Turner Error PDBStringTable::reload(BinaryStreamReader &Reader) {
84c504ae3cSZachary Turner 
85c504ae3cSZachary Turner   BinaryStreamReader SectionReader;
86c504ae3cSZachary Turner 
87c504ae3cSZachary Turner   std::tie(SectionReader, Reader) = Reader.split(sizeof(PDBStringTableHeader));
88c504ae3cSZachary Turner   if (auto EC = readHeader(SectionReader))
89c504ae3cSZachary Turner     return EC;
90c504ae3cSZachary Turner 
91c504ae3cSZachary Turner   std::tie(SectionReader, Reader) = Reader.split(Header->ByteSize);
92c504ae3cSZachary Turner   if (auto EC = readStrings(SectionReader))
93c504ae3cSZachary Turner     return EC;
94c504ae3cSZachary Turner 
95c504ae3cSZachary Turner   // We don't know how long the hash table is until we parse it, so let the
96c504ae3cSZachary Turner   // function responsible for doing that figure it out.
97c504ae3cSZachary Turner   if (auto EC = readHashTable(Reader))
98c504ae3cSZachary Turner     return EC;
99c504ae3cSZachary Turner 
100c504ae3cSZachary Turner   std::tie(SectionReader, Reader) = Reader.split(sizeof(uint32_t));
101c504ae3cSZachary Turner   if (auto EC = readEpilogue(SectionReader))
102c504ae3cSZachary Turner     return EC;
103c504ae3cSZachary Turner 
104c504ae3cSZachary Turner   assert(Reader.bytesRemaining() == 0);
105c504ae3cSZachary Turner   return Error::success();
106c504ae3cSZachary Turner }
107e204a6c9SZachary Turner 
getStringForID(uint32_t ID) const1082d5c2cd3SZachary Turner Expected<StringRef> PDBStringTable::getStringForID(uint32_t ID) const {
109c504ae3cSZachary Turner   return Strings.getString(ID);
110e204a6c9SZachary Turner }
111e204a6c9SZachary Turner 
getIDForString(StringRef Str) const1122d5c2cd3SZachary Turner Expected<uint32_t> PDBStringTable::getIDForString(StringRef Str) const {
113c504ae3cSZachary Turner   uint32_t Hash =
114c504ae3cSZachary Turner       (Header->HashVersion == 1) ? hashStringV1(Str) : hashStringV2(Str);
115e204a6c9SZachary Turner   size_t Count = IDs.size();
116e204a6c9SZachary Turner   uint32_t Start = Hash % Count;
117e204a6c9SZachary Turner   for (size_t I = 0; I < Count; ++I) {
118e204a6c9SZachary Turner     // The hash is just a starting point for the search, but if it
119e204a6c9SZachary Turner     // doesn't work we should find the string no matter what, because
120e204a6c9SZachary Turner     // we iterate the entire array.
121e204a6c9SZachary Turner     uint32_t Index = (Start + I) % Count;
122e204a6c9SZachary Turner 
123eb629994SZachary Turner     // If we find 0, it means the item isn't in the hash table.
124e204a6c9SZachary Turner     uint32_t ID = IDs[Index];
125eb629994SZachary Turner     if (ID == 0)
126eb629994SZachary Turner       return make_error<RawError>(raw_error_code::no_entry);
1272d5c2cd3SZachary Turner     auto ExpectedStr = getStringForID(ID);
1282d5c2cd3SZachary Turner     if (!ExpectedStr)
1292d5c2cd3SZachary Turner       return ExpectedStr.takeError();
1302d5c2cd3SZachary Turner 
1312d5c2cd3SZachary Turner     if (*ExpectedStr == Str)
132e204a6c9SZachary Turner       return ID;
133e204a6c9SZachary Turner   }
1342d5c2cd3SZachary Turner   return make_error<RawError>(raw_error_code::no_entry);
135e204a6c9SZachary Turner }
136e204a6c9SZachary Turner 
name_ids() const137e204a6c9SZachary Turner FixedStreamArray<support::ulittle32_t> PDBStringTable::name_ids() const {
138e204a6c9SZachary Turner   return IDs;
139e204a6c9SZachary Turner }
140