//===- PublicsStream.cpp - PDB Public Symbol Stream -----------------------===// // // The LLVM Compiler Infrastructure // // This file is distributed under the University of Illinois Open Source // License. See LICENSE.TXT for details. // //===----------------------------------------------------------------------===// // // The data structures defined in this file are based on the reference // implementation which is available at // https://github.com/Microsoft/microsoft-pdb/blob/master/PDB/dbi/gsi.h // // When you are reading the reference source code, you'd find the // information below useful. // // - ppdb1->m_fMinimalDbgInfo seems to be always true. // - SMALLBUCKETS macro is defined. // // The reference doesn't compile, so I learned just by reading code. // It's not guaranteed to be correct. // //===----------------------------------------------------------------------===// #include "llvm/DebugInfo/PDB/Raw/PublicsStream.h" #include "llvm/DebugInfo/CodeView/CodeView.h" #include "llvm/DebugInfo/CodeView/StreamReader.h" #include "llvm/DebugInfo/CodeView/TypeRecord.h" #include "llvm/DebugInfo/PDB/Raw/IndexedStreamData.h" #include "llvm/DebugInfo/PDB/Raw/MappedBlockStream.h" #include "llvm/DebugInfo/PDB/Raw/PDBFile.h" #include "llvm/DebugInfo/PDB/Raw/RawConstants.h" #include "llvm/DebugInfo/PDB/Raw/RawError.h" #include "llvm/DebugInfo/PDB/Raw/SymbolStream.h" #include "llvm/ADT/BitVector.h" #include "llvm/Support/Endian.h" #include "llvm/Support/Format.h" #include "llvm/Support/MathExtras.h" using namespace llvm; using namespace llvm::support; using namespace llvm::pdb; static const unsigned IPHR_HASH = 4096; // This is PSGSIHDR struct defined in // https://github.com/Microsoft/microsoft-pdb/blob/master/PDB/dbi/gsi.h struct PublicsStream::HeaderInfo { ulittle32_t SymHash; ulittle32_t AddrMap; ulittle32_t NumThunks; ulittle32_t SizeOfThunk; ulittle16_t ISectThunkTable; char Padding[2]; ulittle32_t OffThunkTable; ulittle32_t NumSections; }; // This is GSIHashHdr. struct PublicsStream::GSIHashHeader { enum : unsigned { HdrSignature = ~0U, HdrVersion = 0xeffe0000 + 19990810, }; ulittle32_t VerSignature; ulittle32_t VerHdr; ulittle32_t HrSize; ulittle32_t NumBuckets; }; PublicsStream::PublicsStream(PDBFile &File, std::unique_ptr<MappedBlockStream> Stream) : Pdb(File), Stream(std::move(Stream)) {} PublicsStream::~PublicsStream() {} uint32_t PublicsStream::getSymHash() const { return Header->SymHash; } uint32_t PublicsStream::getAddrMap() const { return Header->AddrMap; } // Publics stream contains fixed-size headers and a serialized hash table. // This implementation is not complete yet. It reads till the end of the // stream so that we verify the stream is at least not corrupted. However, // we skip over the hash table which we believe contains information about // public symbols. Error PublicsStream::reload() { codeview::StreamReader Reader(*Stream); // Check stream size. if (Reader.bytesRemaining() < sizeof(HeaderInfo) + sizeof(GSIHashHeader)) return make_error<RawError>(raw_error_code::corrupt_file, "Publics Stream does not contain a header."); // Read PSGSIHDR and GSIHashHdr structs. if (Reader.readObject(Header)) return make_error<RawError>(raw_error_code::corrupt_file, "Publics Stream does not contain a header."); if (Reader.readObject(HashHdr)) return make_error<RawError>(raw_error_code::corrupt_file, "Publics Stream does not contain a header."); // An array of HashRecord follows. Read them. if (HashHdr->HrSize % sizeof(PSHashRecord)) return make_error<RawError>(raw_error_code::corrupt_file, "Invalid HR array size."); uint32_t NumHashRecords = HashHdr->HrSize / sizeof(PSHashRecord); if (auto EC = Reader.readArray(HashRecords, NumHashRecords)) return joinErrors(std::move(EC), make_error<RawError>(raw_error_code::corrupt_file, "Could not read an HR array")); // A bitmap of a fixed length follows. size_t BitmapSizeInBits = alignTo(IPHR_HASH + 1, 32); uint32_t NumBitmapEntries = BitmapSizeInBits / 8; if (auto EC = Reader.readBytes(Bitmap, NumBitmapEntries)) return joinErrors(std::move(EC), make_error<RawError>(raw_error_code::corrupt_file, "Could not read a bitmap.")); for (uint8_t B : Bitmap) NumBuckets += countPopulation(B); // We don't yet understand the following data structures completely, // but we at least know the types and sizes. Here we are trying // to read the stream till end so that we at least can detect // corrupted streams. // Hash buckets follow. if (auto EC = Reader.readArray(HashBuckets, NumBuckets)) return joinErrors(std::move(EC), make_error<RawError>(raw_error_code::corrupt_file, "Hash buckets corrupted.")); // Something called "address map" follows. uint32_t NumAddressMapEntries = Header->AddrMap / sizeof(uint32_t); if (auto EC = Reader.readArray(AddressMap, NumAddressMapEntries)) return joinErrors(std::move(EC), make_error<RawError>(raw_error_code::corrupt_file, "Could not read an address map.")); // Something called "thunk map" follows. if (auto EC = Reader.readArray(ThunkMap, Header->NumThunks)) return joinErrors(std::move(EC), make_error<RawError>(raw_error_code::corrupt_file, "Could not read a thunk map.")); // Something called "section map" follows. if (auto EC = Reader.readArray(SectionOffsets, Header->NumSections)) return joinErrors(std::move(EC), make_error<RawError>(raw_error_code::corrupt_file, "Could not read a section map.")); if (Reader.bytesRemaining() > 0) return make_error<RawError>(raw_error_code::corrupt_file, "Corrupted publics stream."); return Error::success(); } iterator_range<codeview::CVSymbolArray::Iterator> PublicsStream::getSymbols(bool *HadError) const { auto SymbolS = Pdb.getPDBSymbolStream(); if (SymbolS.takeError()) { codeview::CVSymbolArray::Iterator Iter; return llvm::make_range(Iter, Iter); } SymbolStream &SS = SymbolS.get(); return SS.getSymbols(HadError); } Error PublicsStream::commit() { return Error::success(); }