1*0b57cec5SDimitry Andric //===- PDBStringTable.cpp - PDB String Table ---------------------*- C++-*-===//
2*0b57cec5SDimitry Andric //
3*0b57cec5SDimitry Andric // Part of the LLVM Project, under the Apache License v2.0 with LLVM Exceptions.
4*0b57cec5SDimitry Andric // See https://llvm.org/LICENSE.txt for license information.
5*0b57cec5SDimitry Andric // SPDX-License-Identifier: Apache-2.0 WITH LLVM-exception
6*0b57cec5SDimitry Andric //
7*0b57cec5SDimitry Andric //===----------------------------------------------------------------------===//
8*0b57cec5SDimitry Andric
9*0b57cec5SDimitry Andric #include "llvm/DebugInfo/PDB/Native/PDBStringTable.h"
10*0b57cec5SDimitry Andric
11*0b57cec5SDimitry Andric #include "llvm/DebugInfo/PDB/Native/Hash.h"
12*0b57cec5SDimitry Andric #include "llvm/DebugInfo/PDB/Native/RawError.h"
13*0b57cec5SDimitry Andric #include "llvm/DebugInfo/PDB/Native/RawTypes.h"
14*0b57cec5SDimitry Andric #include "llvm/Support/BinaryStreamReader.h"
15*0b57cec5SDimitry Andric #include "llvm/Support/Endian.h"
16*0b57cec5SDimitry Andric
17*0b57cec5SDimitry Andric using namespace llvm;
18*0b57cec5SDimitry Andric using namespace llvm::support;
19*0b57cec5SDimitry Andric using namespace llvm::pdb;
20*0b57cec5SDimitry Andric
getByteSize() const21*0b57cec5SDimitry Andric uint32_t PDBStringTable::getByteSize() const { return Header->ByteSize; }
getNameCount() const22*0b57cec5SDimitry Andric uint32_t PDBStringTable::getNameCount() const { return NameCount; }
getHashVersion() const23*0b57cec5SDimitry Andric uint32_t PDBStringTable::getHashVersion() const { return Header->HashVersion; }
getSignature() const24*0b57cec5SDimitry Andric uint32_t PDBStringTable::getSignature() const { return Header->Signature; }
25*0b57cec5SDimitry Andric
readHeader(BinaryStreamReader & Reader)26*0b57cec5SDimitry Andric Error PDBStringTable::readHeader(BinaryStreamReader &Reader) {
27*0b57cec5SDimitry Andric if (auto EC = Reader.readObject(Header))
28*0b57cec5SDimitry Andric return EC;
29*0b57cec5SDimitry Andric
30*0b57cec5SDimitry Andric if (Header->Signature != PDBStringTableSignature)
31*0b57cec5SDimitry Andric return make_error<RawError>(raw_error_code::corrupt_file,
32*0b57cec5SDimitry Andric "Invalid hash table signature");
33*0b57cec5SDimitry Andric if (Header->HashVersion != 1 && Header->HashVersion != 2)
34*0b57cec5SDimitry Andric return make_error<RawError>(raw_error_code::corrupt_file,
35*0b57cec5SDimitry Andric "Unsupported hash version");
36*0b57cec5SDimitry Andric
37*0b57cec5SDimitry Andric assert(Reader.bytesRemaining() == 0);
38*0b57cec5SDimitry Andric return Error::success();
39*0b57cec5SDimitry Andric }
40*0b57cec5SDimitry Andric
readStrings(BinaryStreamReader & Reader)41*0b57cec5SDimitry Andric Error PDBStringTable::readStrings(BinaryStreamReader &Reader) {
42*0b57cec5SDimitry Andric BinaryStreamRef Stream;
43*0b57cec5SDimitry Andric if (auto EC = Reader.readStreamRef(Stream))
44*0b57cec5SDimitry Andric return EC;
45*0b57cec5SDimitry Andric
46*0b57cec5SDimitry Andric if (auto EC = Strings.initialize(Stream)) {
47*0b57cec5SDimitry Andric return joinErrors(std::move(EC),
48*0b57cec5SDimitry Andric make_error<RawError>(raw_error_code::corrupt_file,
49*0b57cec5SDimitry Andric "Invalid hash table byte length"));
50*0b57cec5SDimitry Andric }
51*0b57cec5SDimitry Andric
52*0b57cec5SDimitry Andric assert(Reader.bytesRemaining() == 0);
53*0b57cec5SDimitry Andric return Error::success();
54*0b57cec5SDimitry Andric }
55*0b57cec5SDimitry Andric
56*0b57cec5SDimitry Andric const codeview::DebugStringTableSubsectionRef &
getStringTable() const57*0b57cec5SDimitry Andric PDBStringTable::getStringTable() const {
58*0b57cec5SDimitry Andric return Strings;
59*0b57cec5SDimitry Andric }
60*0b57cec5SDimitry Andric
readHashTable(BinaryStreamReader & Reader)61*0b57cec5SDimitry Andric Error PDBStringTable::readHashTable(BinaryStreamReader &Reader) {
62*0b57cec5SDimitry Andric const support::ulittle32_t *HashCount;
63*0b57cec5SDimitry Andric if (auto EC = Reader.readObject(HashCount))
64*0b57cec5SDimitry Andric return EC;
65*0b57cec5SDimitry Andric
66*0b57cec5SDimitry Andric if (auto EC = Reader.readArray(IDs, *HashCount)) {
67*0b57cec5SDimitry Andric return joinErrors(std::move(EC),
68*0b57cec5SDimitry Andric make_error<RawError>(raw_error_code::corrupt_file,
69*0b57cec5SDimitry Andric "Could not read bucket array"));
70*0b57cec5SDimitry Andric }
71*0b57cec5SDimitry Andric
72*0b57cec5SDimitry Andric return Error::success();
73*0b57cec5SDimitry Andric }
74*0b57cec5SDimitry Andric
readEpilogue(BinaryStreamReader & Reader)75*0b57cec5SDimitry Andric Error PDBStringTable::readEpilogue(BinaryStreamReader &Reader) {
76*0b57cec5SDimitry Andric if (auto EC = Reader.readInteger(NameCount))
77*0b57cec5SDimitry Andric return EC;
78*0b57cec5SDimitry Andric
79*0b57cec5SDimitry Andric assert(Reader.bytesRemaining() == 0);
80*0b57cec5SDimitry Andric return Error::success();
81*0b57cec5SDimitry Andric }
82*0b57cec5SDimitry Andric
reload(BinaryStreamReader & Reader)83*0b57cec5SDimitry Andric Error PDBStringTable::reload(BinaryStreamReader &Reader) {
84*0b57cec5SDimitry Andric
85*0b57cec5SDimitry Andric BinaryStreamReader SectionReader;
86*0b57cec5SDimitry Andric
87*0b57cec5SDimitry Andric std::tie(SectionReader, Reader) = Reader.split(sizeof(PDBStringTableHeader));
88*0b57cec5SDimitry Andric if (auto EC = readHeader(SectionReader))
89*0b57cec5SDimitry Andric return EC;
90*0b57cec5SDimitry Andric
91*0b57cec5SDimitry Andric std::tie(SectionReader, Reader) = Reader.split(Header->ByteSize);
92*0b57cec5SDimitry Andric if (auto EC = readStrings(SectionReader))
93*0b57cec5SDimitry Andric return EC;
94*0b57cec5SDimitry Andric
95*0b57cec5SDimitry Andric // We don't know how long the hash table is until we parse it, so let the
96*0b57cec5SDimitry Andric // function responsible for doing that figure it out.
97*0b57cec5SDimitry Andric if (auto EC = readHashTable(Reader))
98*0b57cec5SDimitry Andric return EC;
99*0b57cec5SDimitry Andric
100*0b57cec5SDimitry Andric std::tie(SectionReader, Reader) = Reader.split(sizeof(uint32_t));
101*0b57cec5SDimitry Andric if (auto EC = readEpilogue(SectionReader))
102*0b57cec5SDimitry Andric return EC;
103*0b57cec5SDimitry Andric
104*0b57cec5SDimitry Andric assert(Reader.bytesRemaining() == 0);
105*0b57cec5SDimitry Andric return Error::success();
106*0b57cec5SDimitry Andric }
107*0b57cec5SDimitry Andric
getStringForID(uint32_t ID) const108*0b57cec5SDimitry Andric Expected<StringRef> PDBStringTable::getStringForID(uint32_t ID) const {
109*0b57cec5SDimitry Andric return Strings.getString(ID);
110*0b57cec5SDimitry Andric }
111*0b57cec5SDimitry Andric
getIDForString(StringRef Str) const112*0b57cec5SDimitry Andric Expected<uint32_t> PDBStringTable::getIDForString(StringRef Str) const {
113*0b57cec5SDimitry Andric uint32_t Hash =
114*0b57cec5SDimitry Andric (Header->HashVersion == 1) ? hashStringV1(Str) : hashStringV2(Str);
115*0b57cec5SDimitry Andric size_t Count = IDs.size();
116*0b57cec5SDimitry Andric uint32_t Start = Hash % Count;
117*0b57cec5SDimitry Andric for (size_t I = 0; I < Count; ++I) {
118*0b57cec5SDimitry Andric // The hash is just a starting point for the search, but if it
119*0b57cec5SDimitry Andric // doesn't work we should find the string no matter what, because
120*0b57cec5SDimitry Andric // we iterate the entire array.
121*0b57cec5SDimitry Andric uint32_t Index = (Start + I) % Count;
122*0b57cec5SDimitry Andric
123*0b57cec5SDimitry Andric // If we find 0, it means the item isn't in the hash table.
124*0b57cec5SDimitry Andric uint32_t ID = IDs[Index];
125*0b57cec5SDimitry Andric if (ID == 0)
126*0b57cec5SDimitry Andric return make_error<RawError>(raw_error_code::no_entry);
127*0b57cec5SDimitry Andric auto ExpectedStr = getStringForID(ID);
128*0b57cec5SDimitry Andric if (!ExpectedStr)
129*0b57cec5SDimitry Andric return ExpectedStr.takeError();
130*0b57cec5SDimitry Andric
131*0b57cec5SDimitry Andric if (*ExpectedStr == Str)
132*0b57cec5SDimitry Andric return ID;
133*0b57cec5SDimitry Andric }
134*0b57cec5SDimitry Andric return make_error<RawError>(raw_error_code::no_entry);
135*0b57cec5SDimitry Andric }
136*0b57cec5SDimitry Andric
name_ids() const137*0b57cec5SDimitry Andric FixedStreamArray<support::ulittle32_t> PDBStringTable::name_ids() const {
138*0b57cec5SDimitry Andric return IDs;
139*0b57cec5SDimitry Andric }
140