//===- PDBStringTableBuilder.cpp - PDB String Table -------------*- C++ -*-===//
// The LLVM Compiler Infrastructure
// This file is distributed under the University of Illinois Open Source
// License. See LICENSE.TXT for details.
//===----------------------------------------------------------------------===//
10 #include "llvm/DebugInfo/PDB/Native/PDBStringTableBuilder.h"
12 #include "llvm/ADT/ArrayRef.h"
13 #include "llvm/DebugInfo/PDB/Native/Hash.h"
14 #include "llvm/DebugInfo/PDB/Native/RawTypes.h"
15 #include "llvm/Support/BinaryStreamWriter.h"
16 #include "llvm/Support/Endian.h"
19 using namespace llvm::msf;
20 using namespace llvm::support;
21 using namespace llvm::support::endian;
22 using namespace llvm::pdb;
24 uint32_t PDBStringTableBuilder::insert(StringRef S) {
25 return Strings.insert(S);
/// Computes how many hash buckets to allocate for \p NumStrings strings.
///
/// \param NumStrings number of strings that will be placed in the table.
/// \returns floor(1.25 * (NumStrings + 1)).
static uint32_t computeBucketCount(uint32_t NumStrings) {
  // The /names stream is basically an on-disk open-addressing hash table.
  // Hash collisions are resolved by linear probing. We cannot make
  // utilization 100% because it will make the linear probing extremely
  // slow. But lower utilization wastes disk space. As a reasonable
  // load factor, we choose 80%. We need +1 because slot 0 is reserved.
  //
  // N + N / 4 equals floor(N * 1.25) for every integer N, so the result is
  // the same as the floating-point form without an implicit
  // double -> uint32_t narrowing conversion.
  const uint32_t Slots = NumStrings + 1;
  return Slots + Slots / 4;
}
37 uint32_t PDBStringTableBuilder::calculateHashTableSize() const {
38 uint32_t Size = sizeof(uint32_t); // Hash table begins with 4-byte size field.
39 Size += sizeof(uint32_t) * computeBucketCount(Strings.size());
44 uint32_t PDBStringTableBuilder::calculateSerializedSize() const {
46 Size += sizeof(PDBStringTableHeader);
47 Size += Strings.calculateSerializedSize();
48 Size += calculateHashTableSize();
49 Size += sizeof(uint32_t); // The /names stream ends with the string count.
53 void PDBStringTableBuilder::setStrings(
54 const codeview::DebugStringTableSubsection &Strings) {
55 this->Strings = Strings;
58 Error PDBStringTableBuilder::writeHeader(BinaryStreamWriter &Writer) const {
60 PDBStringTableHeader H;
61 H.Signature = PDBStringTableSignature;
63 H.ByteSize = Strings.calculateSerializedSize();
64 if (auto EC = Writer.writeObject(H))
66 assert(Writer.bytesRemaining() == 0);
67 return Error::success();
70 Error PDBStringTableBuilder::writeStrings(BinaryStreamWriter &Writer) const {
71 if (auto EC = Strings.commit(Writer))
74 assert(Writer.bytesRemaining() == 0);
75 return Error::success();
78 Error PDBStringTableBuilder::writeHashTable(BinaryStreamWriter &Writer) const {
79 // Write a hash table.
80 uint32_t BucketCount = computeBucketCount(Strings.size());
81 if (auto EC = Writer.writeInteger(BucketCount))
83 std::vector<ulittle32_t> Buckets(BucketCount);
85 for (auto &Pair : Strings) {
86 StringRef S = Pair.getKey();
87 uint32_t Offset = Pair.getValue();
88 uint32_t Hash = hashStringV1(S);
90 for (uint32_t I = 0; I != BucketCount; ++I) {
91 uint32_t Slot = (Hash + I) % BucketCount;
93 continue; // Skip reserved slot
94 if (Buckets[Slot] != 0)
96 Buckets[Slot] = Offset;
101 if (auto EC = Writer.writeArray(ArrayRef<ulittle32_t>(Buckets)))
104 assert(Writer.bytesRemaining() == 0);
105 return Error::success();
108 Error PDBStringTableBuilder::writeEpilogue(BinaryStreamWriter &Writer) const {
109 if (auto EC = Writer.writeInteger<uint32_t>(Strings.size()))
111 assert(Writer.bytesRemaining() == 0);
112 return Error::success();
115 Error PDBStringTableBuilder::commit(BinaryStreamWriter &Writer) const {
116 BinaryStreamWriter SectionWriter;
118 std::tie(SectionWriter, Writer) = Writer.split(sizeof(PDBStringTableHeader));
119 if (auto EC = writeHeader(SectionWriter))
122 std::tie(SectionWriter, Writer) =
123 Writer.split(Strings.calculateSerializedSize());
124 if (auto EC = writeStrings(SectionWriter))
127 std::tie(SectionWriter, Writer) = Writer.split(calculateHashTableSize());
128 if (auto EC = writeHashTable(SectionWriter))
131 std::tie(SectionWriter, Writer) = Writer.split(sizeof(uint32_t));
132 if (auto EC = writeEpilogue(SectionWriter))
135 return Error::success();