1 //===- DbiStream.cpp - PDB Dbi Stream (Stream 3) Access -------------------===//
2 //
3 //                     The LLVM Compiler Infrastructure
4 //
5 // This file is distributed under the University of Illinois Open Source
6 // License. See LICENSE.TXT for details.
7 //
8 //===----------------------------------------------------------------------===//
9 
10 #include "llvm/DebugInfo/PDB/Raw/DbiStream.h"
11 
12 #include "llvm/DebugInfo/CodeView/StreamArray.h"
13 #include "llvm/DebugInfo/CodeView/StreamReader.h"
14 #include "llvm/DebugInfo/CodeView/StreamWriter.h"
15 #include "llvm/DebugInfo/PDB/Raw/ISectionContribVisitor.h"
16 #include "llvm/DebugInfo/PDB/Raw/IndexedStreamData.h"
17 #include "llvm/DebugInfo/PDB/Raw/InfoStream.h"
18 #include "llvm/DebugInfo/PDB/Raw/ModInfo.h"
19 #include "llvm/DebugInfo/PDB/Raw/NameHashTable.h"
20 #include "llvm/DebugInfo/PDB/Raw/PDBFile.h"
21 #include "llvm/DebugInfo/PDB/Raw/RawConstants.h"
22 #include "llvm/DebugInfo/PDB/Raw/RawError.h"
23 #include "llvm/DebugInfo/PDB/Raw/RawTypes.h"
24 #include "llvm/Object/COFF.h"
25 
26 using namespace llvm;
27 using namespace llvm::codeview;
28 using namespace llvm::pdb;
29 using namespace llvm::support;
30 
31 namespace {
32 // Some of the values are stored in bitfields.  Since this needs to be portable
33 // across compilers and architectures (big / little endian in particular) we
34 // can't use the actual structures below, but must instead do the shifting
35 // and masking ourselves.  The struct definitions are provided for reference.
36 
37 // struct DbiFlags {
38 //  uint16_t IncrementalLinking : 1;  // True if linked incrementally
39 //  uint16_t IsStripped : 1;          // True if private symbols were stripped.
40 //  uint16_t HasCTypes : 1;           // True if linked with /debug:ctypes.
41 //  uint16_t Reserved : 13;
42 //};
43 const uint16_t FlagIncrementalMask = 0x0001;
44 const uint16_t FlagStrippedMask = 0x0002;
45 const uint16_t FlagHasCTypesMask = 0x0004;
46 
47 // struct DbiBuildNo {
48 //  uint16_t MinorVersion : 8;
49 //  uint16_t MajorVersion : 7;
50 //  uint16_t NewVersionFormat : 1;
51 //};
52 const uint16_t BuildMinorMask = 0x00FF;
53 const uint16_t BuildMinorShift = 0;
54 
55 const uint16_t BuildMajorMask = 0x7F00;
56 const uint16_t BuildMajorShift = 8;
57 
58 struct FileInfoSubstreamHeader {
59   ulittle16_t NumModules;     // Total # of modules, should match number of
60                               // records in the ModuleInfo substream.
61   ulittle16_t NumSourceFiles; // Total # of source files.  This value is not
62                               // accurate because PDB actually supports more
63                               // than 64k source files, so we ignore it and
64                               // compute the value from other stream fields.
65 };
66 }
67 
68 template <typename ContribType>
loadSectionContribs(FixedStreamArray<ContribType> & Output,StreamReader & Reader)69 static Error loadSectionContribs(FixedStreamArray<ContribType> &Output,
70                                  StreamReader &Reader) {
71   if (Reader.bytesRemaining() % sizeof(ContribType) != 0)
72     return make_error<RawError>(
73         raw_error_code::corrupt_file,
74         "Invalid number of bytes of section contributions");
75 
76   uint32_t Count = Reader.bytesRemaining() / sizeof(ContribType);
77   if (auto EC = Reader.readArray(Output, Count))
78     return EC;
79   return Error::success();
80 }
81 
DbiStream(PDBFile & File,std::unique_ptr<MappedBlockStream> Stream)82 DbiStream::DbiStream(PDBFile &File, std::unique_ptr<MappedBlockStream> Stream)
83     : Pdb(File), Stream(std::move(Stream)), Header(nullptr) {
84   static_assert(sizeof(HeaderInfo) == 64, "Invalid HeaderInfo size!");
85 }
86 
~DbiStream()87 DbiStream::~DbiStream() {}
88 
reload()89 Error DbiStream::reload() {
90   StreamReader Reader(*Stream);
91 
92   if (Stream->getLength() < sizeof(HeaderInfo))
93     return make_error<RawError>(raw_error_code::corrupt_file,
94                                 "DBI Stream does not contain a header.");
95   if (auto EC = Reader.readObject(Header))
96     return make_error<RawError>(raw_error_code::corrupt_file,
97                                 "DBI Stream does not contain a header.");
98 
99   if (Header->VersionSignature != -1)
100     return make_error<RawError>(raw_error_code::corrupt_file,
101                                 "Invalid DBI version signature.");
102 
103   // Require at least version 7, which should be present in all PDBs
104   // produced in the last decade and allows us to avoid having to
105   // special case all kinds of complicated arcane formats.
106   if (Header->VersionHeader < PdbDbiV70)
107     return make_error<RawError>(raw_error_code::feature_unsupported,
108                                 "Unsupported DBI version.");
109 
110   auto IS = Pdb.getPDBInfoStream();
111   if (!IS)
112     return IS.takeError();
113 
114   if (Header->Age != IS->getAge())
115     return make_error<RawError>(raw_error_code::corrupt_file,
116                                 "DBI Age does not match PDB Age.");
117 
118   if (Stream->getLength() !=
119       sizeof(HeaderInfo) + Header->ModiSubstreamSize +
120           Header->SecContrSubstreamSize + Header->SectionMapSize +
121           Header->FileInfoSize + Header->TypeServerSize +
122           Header->OptionalDbgHdrSize + Header->ECSubstreamSize)
123     return make_error<RawError>(raw_error_code::corrupt_file,
124                                 "DBI Length does not equal sum of substreams.");
125 
126   // Only certain substreams are guaranteed to be aligned.  Validate
127   // them here.
128   if (Header->ModiSubstreamSize % sizeof(uint32_t) != 0)
129     return make_error<RawError>(raw_error_code::corrupt_file,
130                                 "DBI MODI substream not aligned.");
131   if (Header->SecContrSubstreamSize % sizeof(uint32_t) != 0)
132     return make_error<RawError>(
133         raw_error_code::corrupt_file,
134         "DBI section contribution substream not aligned.");
135   if (Header->SectionMapSize % sizeof(uint32_t) != 0)
136     return make_error<RawError>(raw_error_code::corrupt_file,
137                                 "DBI section map substream not aligned.");
138   if (Header->FileInfoSize % sizeof(uint32_t) != 0)
139     return make_error<RawError>(raw_error_code::corrupt_file,
140                                 "DBI file info substream not aligned.");
141   if (Header->TypeServerSize % sizeof(uint32_t) != 0)
142     return make_error<RawError>(raw_error_code::corrupt_file,
143                                 "DBI type server substream not aligned.");
144 
145   // Since each ModInfo in the stream is a variable length, we have to iterate
146   // them to know how many there actually are.
147   VarStreamArray<ModInfo> ModInfoArray;
148   if (auto EC = Reader.readArray(ModInfoArray, Header->ModiSubstreamSize))
149     return EC;
150   for (auto &Info : ModInfoArray) {
151     ModuleInfos.emplace_back(Info);
152   }
153 
154   if (auto EC = Reader.readStreamRef(SecContrSubstream,
155                                      Header->SecContrSubstreamSize))
156     return EC;
157   if (auto EC = Reader.readStreamRef(SecMapSubstream, Header->SectionMapSize))
158     return EC;
159   if (auto EC = Reader.readStreamRef(FileInfoSubstream, Header->FileInfoSize))
160     return EC;
161   if (auto EC =
162           Reader.readStreamRef(TypeServerMapSubstream, Header->TypeServerSize))
163     return EC;
164   if (auto EC = Reader.readStreamRef(ECSubstream, Header->ECSubstreamSize))
165     return EC;
166   if (auto EC = Reader.readArray(DbgStreams, Header->OptionalDbgHdrSize /
167                                                  sizeof(ulittle16_t)))
168     return EC;
169 
170   if (auto EC = initializeSectionContributionData())
171     return EC;
172   if (auto EC = initializeSectionHeadersData())
173     return EC;
174   if (auto EC = initializeSectionMapData())
175     return EC;
176   if (auto EC = initializeFileInfo())
177     return EC;
178   if (auto EC = initializeFpoRecords())
179     return EC;
180 
181   if (Reader.bytesRemaining() > 0)
182     return make_error<RawError>(raw_error_code::corrupt_file,
183                                 "Found unexpected bytes in DBI Stream.");
184 
185   StreamReader ECReader(ECSubstream);
186   if (auto EC = ECNames.load(ECReader))
187     return EC;
188 
189   return Error::success();
190 }
191 
getDbiVersion() const192 PdbRaw_DbiVer DbiStream::getDbiVersion() const {
193   uint32_t Value = Header->VersionHeader;
194   return static_cast<PdbRaw_DbiVer>(Value);
195 }
196 
getAge() const197 uint32_t DbiStream::getAge() const { return Header->Age; }
198 
getPublicSymbolStreamIndex() const199 uint16_t DbiStream::getPublicSymbolStreamIndex() const {
200   return Header->PublicSymbolStreamIndex;
201 }
202 
getGlobalSymbolStreamIndex() const203 uint16_t DbiStream::getGlobalSymbolStreamIndex() const {
204   return Header->GlobalSymbolStreamIndex;
205 }
206 
getFlags() const207 uint16_t DbiStream::getFlags() const { return Header->Flags; }
208 
isIncrementallyLinked() const209 bool DbiStream::isIncrementallyLinked() const {
210   return (Header->Flags & FlagIncrementalMask) != 0;
211 }
212 
hasCTypes() const213 bool DbiStream::hasCTypes() const {
214   return (Header->Flags & FlagHasCTypesMask) != 0;
215 }
216 
isStripped() const217 bool DbiStream::isStripped() const {
218   return (Header->Flags & FlagStrippedMask) != 0;
219 }
220 
getBuildNumber() const221 uint16_t DbiStream::getBuildNumber() const { return Header->BuildNumber; }
222 
getBuildMajorVersion() const223 uint16_t DbiStream::getBuildMajorVersion() const {
224   return (Header->BuildNumber & BuildMajorMask) >> BuildMajorShift;
225 }
226 
getBuildMinorVersion() const227 uint16_t DbiStream::getBuildMinorVersion() const {
228   return (Header->BuildNumber & BuildMinorMask) >> BuildMinorShift;
229 }
230 
getPdbDllRbld() const231 uint16_t DbiStream::getPdbDllRbld() const { return Header->PdbDllRbld; }
232 
getPdbDllVersion() const233 uint32_t DbiStream::getPdbDllVersion() const { return Header->PdbDllVersion; }
234 
getSymRecordStreamIndex() const235 uint32_t DbiStream::getSymRecordStreamIndex() const {
236   return Header->SymRecordStreamIndex;
237 }
238 
getMachineType() const239 PDB_Machine DbiStream::getMachineType() const {
240   uint16_t Machine = Header->MachineType;
241   return static_cast<PDB_Machine>(Machine);
242 }
243 
244 codeview::FixedStreamArray<object::coff_section>
getSectionHeaders()245 DbiStream::getSectionHeaders() {
246   return SectionHeaders;
247 }
248 
getFpoRecords()249 codeview::FixedStreamArray<object::FpoData> DbiStream::getFpoRecords() {
250   return FpoRecords;
251 }
252 
modules() const253 ArrayRef<ModuleInfoEx> DbiStream::modules() const { return ModuleInfos; }
getSectionMap() const254 codeview::FixedStreamArray<SecMapEntry> DbiStream::getSectionMap() const {
255   return SectionMap;
256 }
257 
visitSectionContributions(ISectionContribVisitor & Visitor) const258 void llvm::pdb::DbiStream::visitSectionContributions(
259     ISectionContribVisitor &Visitor) const {
260   if (SectionContribVersion == DbiSecContribVer60) {
261     for (auto &SC : SectionContribs)
262       Visitor.visit(SC);
263   } else if (SectionContribVersion == DbiSecContribV2) {
264     for (auto &SC : SectionContribs2)
265       Visitor.visit(SC);
266   }
267 }
268 
initializeSectionContributionData()269 Error DbiStream::initializeSectionContributionData() {
270   StreamReader SCReader(SecContrSubstream);
271   if (auto EC = SCReader.readEnum(SectionContribVersion))
272     return EC;
273 
274   if (SectionContribVersion == DbiSecContribVer60)
275     return loadSectionContribs<SectionContrib>(SectionContribs, SCReader);
276   if (SectionContribVersion == DbiSecContribV2)
277     return loadSectionContribs<SectionContrib2>(SectionContribs2, SCReader);
278 
279   return make_error<RawError>(raw_error_code::feature_unsupported,
280                               "Unsupported DBI Section Contribution version");
281 }
282 
283 // Initializes this->SectionHeaders.
initializeSectionHeadersData()284 Error DbiStream::initializeSectionHeadersData() {
285   uint32_t StreamNum = getDebugStreamIndex(DbgHeaderType::SectionHdr);
286   if (StreamNum >= Pdb.getNumStreams())
287     return make_error<RawError>(raw_error_code::no_stream);
288 
289   auto SHS = MappedBlockStream::createIndexedStream(StreamNum, Pdb);
290   if (!SHS)
291     return SHS.takeError();
292 
293   size_t StreamLen = (*SHS)->getLength();
294   if (StreamLen % sizeof(object::coff_section))
295     return make_error<RawError>(raw_error_code::corrupt_file,
296                                 "Corrupted section header stream.");
297 
298   size_t NumSections = StreamLen / sizeof(object::coff_section);
299   codeview::StreamReader Reader(**SHS);
300   if (auto EC = Reader.readArray(SectionHeaders, NumSections))
301     return make_error<RawError>(raw_error_code::corrupt_file,
302                                 "Could not read a bitmap.");
303 
304   SectionHeaderStream = std::move(*SHS);
305   return Error::success();
306 }
307 
308 // Initializes this->Fpos.
initializeFpoRecords()309 Error DbiStream::initializeFpoRecords() {
310   uint32_t StreamNum = getDebugStreamIndex(DbgHeaderType::NewFPO);
311 
312   // This means there is no FPO data.
313   if (StreamNum == InvalidStreamIndex)
314     return Error::success();
315 
316   if (StreamNum >= Pdb.getNumStreams())
317     return make_error<RawError>(raw_error_code::no_stream);
318 
319   auto FS = MappedBlockStream::createIndexedStream(StreamNum, Pdb);
320   if (!FS)
321     return FS.takeError();
322 
323   size_t StreamLen = (*FS)->getLength();
324   if (StreamLen % sizeof(object::FpoData))
325     return make_error<RawError>(raw_error_code::corrupt_file,
326                                 "Corrupted New FPO stream.");
327 
328   size_t NumRecords = StreamLen / sizeof(object::FpoData);
329   codeview::StreamReader Reader(**FS);
330   if (auto EC = Reader.readArray(FpoRecords, NumRecords))
331     return make_error<RawError>(raw_error_code::corrupt_file,
332                                 "Corrupted New FPO stream.");
333   FpoStream = std::move(*FS);
334   return Error::success();
335 }
336 
initializeSectionMapData()337 Error DbiStream::initializeSectionMapData() {
338   StreamReader SMReader(SecMapSubstream);
339   const SecMapHeader *Header;
340   if (auto EC = SMReader.readObject(Header))
341     return EC;
342   if (auto EC = SMReader.readArray(SectionMap, Header->SecCount))
343     return EC;
344   return Error::success();
345 }
346 
initializeFileInfo()347 Error DbiStream::initializeFileInfo() {
348   // The layout of the FileInfoSubstream is like this:
349   // struct {
350   //   ulittle16_t NumModules;
351   //   ulittle16_t NumSourceFiles;
352   //   ulittle16_t ModIndices[NumModules];
353   //   ulittle16_t ModFileCounts[NumModules];
354   //   ulittle32_t FileNameOffsets[NumSourceFiles];
355   //   char Names[][NumSourceFiles];
356   // };
357   // with the caveat that `NumSourceFiles` cannot be trusted, so
358   // it is computed by summing `ModFileCounts`.
359   //
360   const FileInfoSubstreamHeader *FH;
361   StreamReader FISR(FileInfoSubstream);
362   if (auto EC = FISR.readObject(FH))
363     return EC;
364 
365   // The number of modules in the stream should be the same as reported by
366   // the FileInfoSubstreamHeader.
367   if (FH->NumModules != ModuleInfos.size())
368     return make_error<RawError>(raw_error_code::corrupt_file,
369                                 "FileInfo substream count doesn't match DBI.");
370 
371   FixedStreamArray<ulittle16_t> ModIndexArray;
372   FixedStreamArray<ulittle16_t> ModFileCountArray;
373 
374   // First is an array of `NumModules` module indices.  This is not used for the
375   // same reason that `NumSourceFiles` is not used.  It's an array of uint16's,
376   // but it's possible there are more than 64k source files, which would imply
377   // more than 64k modules (e.g. object files) as well.  So we ignore this
378   // field.
379   if (auto EC = FISR.readArray(ModIndexArray, ModuleInfos.size()))
380     return EC;
381   if (auto EC = FISR.readArray(ModFileCountArray, ModuleInfos.size()))
382     return EC;
383 
384   // Compute the real number of source files.
385   uint32_t NumSourceFiles = 0;
386   for (auto Count : ModFileCountArray)
387     NumSourceFiles += Count;
388 
389   // This is the array that in the reference implementation corresponds to
390   // `ModInfo::FileLayout::FileNameOffs`, which is commented there as being a
391   // pointer. Due to the mentioned problems of pointers causing difficulty
392   // when reading from the file on 64-bit systems, we continue to ignore that
393   // field in `ModInfo`, and instead build a vector of StringRefs and stores
394   // them in `ModuleInfoEx`.  The value written to and read from the file is
395   // not used anyway, it is only there as a way to store the offsets for the
396   // purposes of later accessing the names at runtime.
397   if (auto EC = FISR.readArray(FileNameOffsets, NumSourceFiles))
398     return EC;
399 
400   if (auto EC = FISR.readStreamRef(NamesBuffer))
401     return EC;
402 
403   // We go through each ModuleInfo, determine the number N of source files for
404   // that module, and then get the next N offsets from the Offsets array, using
405   // them to get the corresponding N names from the Names buffer and associating
406   // each one with the corresponding module.
407   uint32_t NextFileIndex = 0;
408   for (size_t I = 0; I < ModuleInfos.size(); ++I) {
409     uint32_t NumFiles = ModFileCountArray[I];
410     ModuleInfos[I].SourceFiles.resize(NumFiles);
411     for (size_t J = 0; J < NumFiles; ++J, ++NextFileIndex) {
412       auto ThisName = getFileNameForIndex(NextFileIndex);
413       if (!ThisName)
414         return ThisName.takeError();
415       ModuleInfos[I].SourceFiles[J] = *ThisName;
416     }
417   }
418 
419   return Error::success();
420 }
421 
getDebugStreamIndex(DbgHeaderType Type) const422 uint32_t DbiStream::getDebugStreamIndex(DbgHeaderType Type) const {
423   return DbgStreams[static_cast<uint16_t>(Type)];
424 }
425 
getFileNameForIndex(uint32_t Index) const426 Expected<StringRef> DbiStream::getFileNameForIndex(uint32_t Index) const {
427   StreamReader Names(NamesBuffer);
428   if (Index >= FileNameOffsets.size())
429     return make_error<RawError>(raw_error_code::index_out_of_bounds);
430 
431   uint32_t FileOffset = FileNameOffsets[Index];
432   Names.setOffset(FileOffset);
433   StringRef Name;
434   if (auto EC = Names.readZeroString(Name))
435     return std::move(EC);
436   return Name;
437 }
438 
commit()439 Error DbiStream::commit() { return Error::success(); }
440