LLVM 20.0.0git
PDBFileBuilder.cpp
Go to the documentation of this file.
1//===- PDBFileBuilder.cpp - PDB File Creation -------------------*- C++ -*-===//
2//
3// Part of the LLVM Project, under the Apache License v2.0 with LLVM Exceptions.
4// See https://llvm.org/LICENSE.txt for license information.
5// SPDX-License-Identifier: Apache-2.0 WITH LLVM-exception
6//
7//===----------------------------------------------------------------------===//
8
26#include "llvm/Support/CRC.h"
27#include "llvm/Support/Path.h"
29#include "llvm/Support/xxhash.h"
30
31#include <ctime>
32
33using namespace llvm;
34using namespace llvm::codeview;
35using namespace llvm::msf;
36using namespace llvm::pdb;
37using namespace llvm::support;
38
39namespace llvm {
41}
42
44 : Allocator(Allocator), InjectedSourceHashTraits(Strings),
45 InjectedSourceTable(2) {}
46
48
50 auto ExpectedMsf = MSFBuilder::create(Allocator, BlockSize);
51 if (!ExpectedMsf)
52 return ExpectedMsf.takeError();
53 Msf = std::make_unique<MSFBuilder>(std::move(*ExpectedMsf));
54 return Error::success();
55}
56
58
60 if (!Info)
61 Info = std::make_unique<InfoStreamBuilder>(*Msf, NamedStreams);
62 return *Info;
63}
64
66 if (!Dbi)
67 Dbi = std::make_unique<DbiStreamBuilder>(*Msf);
68 return *Dbi;
69}
70
72 if (!Tpi)
73 Tpi = std::make_unique<TpiStreamBuilder>(*Msf, StreamTPI);
74 return *Tpi;
75}
76
78 if (!Ipi)
79 Ipi = std::make_unique<TpiStreamBuilder>(*Msf, StreamIPI);
80 return *Ipi;
81}
82
84 return Strings;
85}
86
88 if (!Gsi)
89 Gsi = std::make_unique<GSIStreamBuilder>(*Msf);
90 return *Gsi;
91}
92
/// Adds a stream of \p Size to the MSF builder and, when that succeeds,
/// records the resulting stream number under \p Name in the named stream map.
///
/// \param Name key under which the new stream is registered in NamedStreams.
/// \param Size size requested from Msf->addStream() for the new stream.
/// \returns the result of Msf->addStream() unchanged: the new stream number on
/// success, or the error it produced (in which case nothing is registered).
93Expected<uint32_t> PDBFileBuilder::allocateNamedStream(StringRef Name,
94 uint32_t Size) {
95 auto ExpectedStream = Msf->addStream(Size);
    // Only register the name when a stream was actually created.
96 if (ExpectedStream)
97 NamedStreams.set(Name, *ExpectedStream);
98 return ExpectedStream;
99}
100
102 Expected<uint32_t> ExpectedIndex = allocateNamedStream(Name, Data.size());
103 if (!ExpectedIndex)
104 return ExpectedIndex.takeError();
105 assert(NamedStreamData.count(*ExpectedIndex) == 0);
106 NamedStreamData[*ExpectedIndex] = std::string(Data);
107 return Error::success();
108}
109
111 std::unique_ptr<MemoryBuffer> Buffer) {
112 // Stream names must be exact matches, since they get looked up in a hash
113 // table and the hash value is dependent on the exact contents of the string.
114 // link.exe lowercases a path and converts / to \, so we must do the same.
115 SmallString<64> VName;
117
120
121 InjectedSourceDescriptor Desc;
122 Desc.Content = std::move(Buffer);
123 Desc.NameIndex = NI;
124 Desc.VNameIndex = VNI;
125 Desc.StreamName = "/src/files/";
126
127 Desc.StreamName += VName;
128
129 InjectedSources.push_back(std::move(Desc));
130}
131
/// Allocates the named streams this builder owns ("/LinkInfo", "/names" and,
/// when sources were injected, "/src/headerblock" plus one stream per source)
/// and calls finalizeMsfLayout() on every sub-builder that has been created.
///
/// \returns the first error reported by a stream allocation or by a
/// sub-builder, otherwise Error::success().
132Error PDBFileBuilder::finalizeMsfLayout() {
133 llvm::TimeTraceScope timeScope("MSF layout");
134
135 if (Ipi && Ipi->getRecordCount() > 0) {
136 // In theory newer PDBs always have an ID stream, but by saying that we're
137 // only going to *really* have an ID stream if there is at least one ID
138 // record, we leave open the opportunity to test older PDBs such as those
139 // that don't have an ID stream.
140 auto &Info = getInfoBuilder();
141 Info.addFeature(PdbRaw_FeatureSig::VC140);
142 }
143
    // Measure the string table now; the value sizes the "/names" stream below.
144 uint32_t StringsLen = Strings.calculateSerializedSize();
145
    // "/LinkInfo" is always allocated, with a requested size of zero.
146 Expected<uint32_t> SN = allocateNamedStream("/LinkInfo", 0);
147 if (!SN)
148 return SN.takeError();
149
150 if (Gsi) {
151 if (auto EC = Gsi->finalizeMsfLayout())
152 return EC;
    // Forward the stream indices reported by the GSI builder to the DBI
    // builder when both exist.
153 if (Dbi) {
154 Dbi->setPublicsStreamIndex(Gsi->getPublicsStreamIndex());
155 Dbi->setGlobalsStreamIndex(Gsi->getGlobalsStreamIndex());
156 Dbi->setSymbolRecordStreamIndex(Gsi->getRecordStreamIndex());
157 }
158 }
159 if (Tpi) {
160 if (auto EC = Tpi->finalizeMsfLayout())
161 return EC;
162 }
163 if (Dbi) {
164 if (auto EC = Dbi->finalizeMsfLayout())
165 return EC;
166 }
167 SN = allocateNamedStream("/names", StringsLen);
168 if (!SN)
169 return SN.takeError();
170
171 if (Ipi) {
172 if (auto EC = Ipi->finalizeMsfLayout())
173 return EC;
174 }
175
    // NOTE(review): Info->finalizeMsfLayout() is called here and again at the
    // end of this function, after the injected-source streams have been added
    // to the named stream map. The "do this last" wording below therefore only
    // holds for the second call; confirm whether this first call is needed.
176 // Do this last, since it relies on the named stream map being complete, and
177 // that can be updated by previous steps in the finalization.
178 if (Info) {
179 if (auto EC = Info->finalizeMsfLayout())
180 return EC;
181 }
182
183 if (!InjectedSources.empty()) {
    // Build one table entry per injected source, keyed by the source's
    // virtual name as stored in the string table.
184 for (const auto &IS : InjectedSources) {
    // CRC of the source contents, computed with a JamCRC seeded with 0.
185 JamCRC CRC(0);
186 CRC.update(arrayRefFromStringRef(IS.Content->getBuffer()));
187
    // NOTE(review): the declaration of Entry (listing line 188) is missing
    // from this copy of the file; the sizeof below suggests it is a
    // SrcHeaderBlockEntry. Confirm against the real source.
189 ::memset(&Entry, 0, sizeof(SrcHeaderBlockEntry));
190 Entry.Size = sizeof(SrcHeaderBlockEntry);
191 Entry.FileSize = IS.Content->getBufferSize();
192 Entry.FileNI = IS.NameIndex;
193 Entry.VFileNI = IS.VNameIndex;
194 Entry.ObjNI = 1;
195 Entry.IsVirtual = 0;
    // NOTE(review): the right-hand side of this assignment (listing line 197)
    // is missing from this copy of the file.
196 Entry.Version =
198 Entry.CRC = CRC.getCRC();
199 StringRef VName = getStringTableBuilder().getStringForId(IS.VNameIndex);
200 InjectedSourceTable.set_as(VName, std::move(Entry),
201 InjectedSourceHashTraits);
202 }
203
    // The header block stream is sized to hold a SrcHeaderBlockHeader plus the
    // serialized form of the table built above.
204 uint32_t SrcHeaderBlockSize =
205 sizeof(SrcHeaderBlockHeader) +
206 InjectedSourceTable.calculateSerializedLength();
207 SN = allocateNamedStream("/src/headerblock", SrcHeaderBlockSize);
208 if (!SN)
209 return SN.takeError();
    // One named stream per injected source, sized to the source's buffer.
210 for (const auto &IS : InjectedSources) {
211 SN = allocateNamedStream(IS.StreamName, IS.Content->getBufferSize());
212 if (!SN)
213 return SN.takeError();
214 }
215 }
216
217 // Do this last, since it relies on the named stream map being complete, and
218 // that can be updated by previous steps in the finalization.
219 if (Info) {
220 if (auto EC = Info->finalizeMsfLayout())
221 return EC;
222 }
223
224 return Error::success();
225}
226
228 uint32_t SN = 0;
229 if (!NamedStreams.get(Name, SN))
230 return llvm::make_error<pdb::RawError>(raw_error_code::no_stream);
231 return SN;
232}
233
/// Writes the "/src/headerblock" named stream: a SrcHeaderBlockHeader followed
/// by the serialized InjectedSourceTable.
///
/// Must only be called when InjectedSourceTable is non-empty (asserted). The
/// stream lookup and both writes go through cantFail(), so a failure in any of
/// them is reported as a fatal error, not returned to the caller.
///
/// \param MsfBuffer destination buffer handed to the stream constructor.
/// \param Layout MSF layout handed to the stream constructor.
234void PDBFileBuilder::commitSrcHeaderBlock(WritableBinaryStream &MsfBuffer,
235 const msf::MSFLayout &Layout) {
236 assert(!InjectedSourceTable.empty());
237
238 uint32_t SN = cantFail(getNamedStreamIndex("/src/headerblock"));
    // NOTE(review): the start of this statement (listing line 239, which
    // declares Stream) is missing from this copy of the file.
240 Layout, MsfBuffer, SN, Allocator);
241 BinaryStreamWriter Writer(*Stream);
242
    // NOTE(review): the declaration of Header (listing line 243) is missing
    // from this copy of the file.
244 ::memset(&Header, 0, sizeof(Header));
245 Header.Version = static_cast<uint32_t>(PdbRaw_SrcHeaderBlockVer::SrcVerOne);
    // Taken before anything has been written through Writer.
246 Header.Size = Writer.bytesRemaining();
247
248 cantFail(Writer.writeObject(Header));
249 cantFail(InjectedSourceTable.commit(Writer));
250
    // The header and the table together must fill the stream exactly.
251 assert(Writer.bytesRemaining() == 0);
252}
253
/// Writes the injected-source header block and then the contents of every
/// injected source into its own named stream. Does nothing when
/// InjectedSourceTable is empty.
///
/// Stream lookups and writes go through cantFail(), so a failure is reported
/// as a fatal error, not returned to the caller.
///
/// \param MsfBuffer destination buffer handed to the stream constructors.
/// \param Layout MSF layout handed to the stream constructors.
254void PDBFileBuilder::commitInjectedSources(WritableBinaryStream &MsfBuffer,
255 const msf::MSFLayout &Layout) {
256 if (InjectedSourceTable.empty())
257 return;
258
259 llvm::TimeTraceScope timeScope("Commit injected sources");
260 commitSrcHeaderBlock(MsfBuffer, Layout);
261
262 for (const auto &IS : InjectedSources) {
263 uint32_t SN = cantFail(getNamedStreamIndex(IS.StreamName));
264
    // NOTE(review): the start of this statement (listing line 265, which
    // declares SourceStream) is missing from this copy of the file.
266 Layout, MsfBuffer, SN, Allocator);
267 BinaryStreamWriter SourceWriter(*SourceStream);
    // The stream is expected to be exactly as large as the source buffer.
268 assert(SourceWriter.bytesRemaining() == IS.Content->getBufferSize());
269 cantFail(SourceWriter.writeBytes(
270 arrayRefFromStringRef(IS.Content->getBuffer())));
271 }
272}
273
275 assert(!Filename.empty());
276 if (auto EC = finalizeMsfLayout())
277 return EC;
278
279 MSFLayout Layout;
280 Expected<FileBufferByteStream> ExpectedMsfBuffer =
281 Msf->commit(Filename, Layout);
282 if (!ExpectedMsfBuffer)
283 return ExpectedMsfBuffer.takeError();
284 FileBufferByteStream Buffer = std::move(*ExpectedMsfBuffer);
285
286 auto ExpectedSN = getNamedStreamIndex("/names");
287 if (!ExpectedSN)
288 return ExpectedSN.takeError();
289
291 Layout, Buffer, *ExpectedSN, Allocator);
292 BinaryStreamWriter NSWriter(*NS);
293 if (auto EC = Strings.commit(NSWriter))
294 return EC;
295
296 {
297 llvm::TimeTraceScope timeScope("Named stream data");
298 for (const auto &NSE : NamedStreamData) {
299 if (NSE.second.empty())
300 continue;
301
303 Layout, Buffer, NSE.first, Allocator);
304 BinaryStreamWriter NSW(*NS);
305 if (auto EC = NSW.writeBytes(arrayRefFromStringRef(NSE.second)))
306 return EC;
307 }
308 }
309
310 if (Info) {
311 if (auto EC = Info->commit(Layout, Buffer))
312 return EC;
313 }
314
315 if (Dbi) {
316 if (auto EC = Dbi->commit(Layout, Buffer))
317 return EC;
318 }
319
320 if (Tpi) {
321 if (auto EC = Tpi->commit(Layout, Buffer))
322 return EC;
323 }
324
325 if (Ipi) {
326 if (auto EC = Ipi->commit(Layout, Buffer))
327 return EC;
328 }
329
330 if (Gsi) {
331 if (auto EC = Gsi->commit(Layout, Buffer))
332 return EC;
333 }
334
335 auto InfoStreamBlocks = Layout.StreamMap[StreamPDB];
336 assert(!InfoStreamBlocks.empty());
337 uint64_t InfoStreamFileOffset =
338 blockToOffset(InfoStreamBlocks.front(), Layout.SB->BlockSize);
339 InfoStreamHeader *H = reinterpret_cast<InfoStreamHeader *>(
340 Buffer.getBufferStart() + InfoStreamFileOffset);
341
342 commitInjectedSources(Buffer, Layout);
343
344 // Set the build id at the very end, after every other byte of the PDB
345 // has been written.
346 if (Info->hashPDBContentsToGUID()) {
347 llvm::TimeTraceScope timeScope("Compute build ID");
348
349 // Compute a hash of all sections of the output file.
350 uint64_t Digest =
351 xxh3_64bits({Buffer.getBufferStart(), Buffer.getBufferEnd()});
352
353 H->Age = 1;
354
355 memcpy(H->Guid.Guid, &Digest, 8);
356 // xxhash only gives us 8 bytes, so put some fixed data in the other half.
357 memcpy(H->Guid.Guid + 8, "LLD PDB.", 8);
358
359 // Put the hash in the Signature field too.
360 H->Signature = static_cast<uint32_t>(Digest);
361
362 // Return GUID to caller.
363 memcpy(Guid, H->Guid.Guid, 16);
364 } else {
365 H->Age = Info->getAge();
366 H->Guid = Info->getGuid();
367 std::optional<uint32_t> Sig = Info->getSignature();
368 H->Signature = Sig ? *Sig : time(nullptr);
369 }
370
371 return Buffer.commit();
372}
Analysis containing CSE Info
Definition: CSEInfo.cpp:27
std::string Name
uint64_t Size
#define H(x, y, z)
Definition: MD5.cpp:57
Basic Register Allocator
assert(ImpDefSCC.getReg()==AMDGPU::SCC &&ImpDefSCC.isDef())
This file defines the SmallString class.
This file contains some functions that are useful when dealing with strings.
static const int BlockSize
Definition: TarWriter.cpp:33
Provides write only access to a subclass of WritableBinaryStream.
Error writeBytes(ArrayRef< uint8_t > Buffer)
Write the bytes specified in Buffer to the underlying stream.
Allocate memory in an ever growing pool, as if by bump-pointer.
Definition: Allocator.h:66
size_type count(const_arg_type_t< KeyT > Val) const
Return 1 if the specified key is in the map, 0 otherwise.
Definition: DenseMap.h:151
Lightweight error class with error context and mandatory checking.
Definition: Error.h:160
static ErrorSuccess success()
Create a success value.
Definition: Error.h:337
Tagged union holding either a T or a Error.
Definition: Error.h:481
Error takeError()
Take ownership of the stored error.
Definition: Error.h:608
An implementation of WritableBinaryStream backed by an llvm FileOutputBuffer.
Error commit() override
For buffered streams, commits changes to the backing store.
uint8_t * getBufferEnd() const
Returns a pointer to the end of the buffer.
uint8_t * getBufferStart() const
Returns a pointer to the start of the buffer.
SmallString - A SmallString is just a SmallVector with methods and accessors that make it work better...
Definition: SmallString.h:26
StringRef - Represent a constant reference to a string, i.e.
Definition: StringRef.h:50
The TimeTraceScope is a helper class to call the begin and end functions of the time trace profiler.
Definition: TimeProfiler.h:163
A BinaryStream which can be read from as well as written to.
Definition: BinaryStream.h:72
static Expected< MSFBuilder > create(BumpPtrAllocator &Allocator, uint32_t BlockSize, uint32_t MinBlockCount=0, bool CanGrow=true)
Create a new MSFBuilder.
Definition: MSFBuilder.cpp:51
static std::unique_ptr< WritableMappedBlockStream > createIndexedStream(const MSFLayout &Layout, WritableBinaryStreamRef MsfData, uint32_t StreamIndex, BumpPtrAllocator &Allocator)
bool set_as(const Key &K, ValueT V, TraitsT &Traits)
Set the entry using a key type that the specified Traits can convert from a real key to an internal k...
Definition: HashTable.h:250
Error commit(BinaryStreamWriter &Writer) const
Definition: HashTable.h:180
bool empty() const
Definition: HashTable.h:208
uint32_t calculateSerializedLength() const
Definition: HashTable.h:153
void set(StringRef Stream, uint32_t StreamNo)
bool get(StringRef Stream, uint32_t &StreamNo) const
TpiStreamBuilder & getTpiBuilder()
msf::MSFBuilder & getMsfBuilder()
PDBStringTableBuilder & getStringTableBuilder()
Error addNamedStream(StringRef Name, StringRef Data)
DbiStreamBuilder & getDbiBuilder()
TpiStreamBuilder & getIpiBuilder()
GSIStreamBuilder & getGsiBuilder()
InfoStreamBuilder & getInfoBuilder()
Error initialize(uint32_t BlockSize)
PDBFileBuilder(BumpPtrAllocator &Allocator)
Error commit(StringRef Filename, codeview::GUID *Guid)
void addInjectedSource(StringRef Name, std::unique_ptr< MemoryBuffer > Buffer)
Expected< uint32_t > getNamedStreamIndex(StringRef Name) const
Error commit(BinaryStreamWriter &Writer) const
StringRef getStringForId(uint32_t Id) const
@ Entry
Definition: COFF.h:826
uint64_t blockToOffset(uint64_t BlockNumber, uint64_t BlockSize)
Definition: MSFCommon.h:135
This is an optimization pass for GlobalISel generic memory operations.
Definition: AddressRanges.h:18
uint64_t xxh3_64bits(ArrayRef< uint8_t > data)
Definition: xxhash.cpp:553
Op::Description Desc
void cantFail(Error Err, const char *Msg=nullptr)
Report a fatal error if Err is a failure value.
Definition: Error.h:756
Description of the encoding of one expression Op.
This represents the 'GUID' type from windows.h.
Definition: GUID.h:21
const SuperBlock * SB
Definition: MSFCommon.h:64
std::vector< ArrayRef< support::ulittle32_t > > StreamMap
Definition: MSFCommon.h:68
support::ulittle32_t BlockSize
Definition: MSFCommon.h:36
The header preceding the global PDB Stream (Stream 1)
Definition: RawTypes.h:304
A single file record entry within the /src/headerblock stream.
Definition: RawTypes.h:331
The header preceding the /src/headerblock stream.
Definition: RawTypes.h:321