blob: 426efb8fd88bc890c26d34c0aaecea71cd194571 [file] [log] [blame]
Rui Ueyama1f6b6e22016-05-13 21:21:53 +00001//===- PublicsStream.cpp - PDB Public Symbol Stream -----------------------===//
2//
3// The LLVM Compiler Infrastructure
4//
5// This file is distributed under the University of Illinois Open Source
6// License. See LICENSE.TXT for details.
7//
8//===----------------------------------------------------------------------===//
9//
10// The data structures defined in this file are based on the reference
11// implementation which is available at
12// https://github.com/Microsoft/microsoft-pdb/blob/master/PDB/dbi/gsi.h
13//
14// When you are reading the reference source code, you'd find the
15// information below useful.
16//
17// - ppdb1->m_fMinimalDbgInfo seems to be always true.
18// - SMALLBUCKETS macro is defined.
19//
20// The reference doesn't compile, so I learned just by reading code.
21// It's not guaranteed to be correct.
22//
23//===----------------------------------------------------------------------===//
24
25#include "llvm/DebugInfo/PDB/Raw/PublicsStream.h"
26
27#include "llvm/DebugInfo/CodeView/CodeView.h"
28#include "llvm/DebugInfo/CodeView/TypeRecord.h"
Zachary Turnerbac69d32016-07-22 19:56:05 +000029#include "llvm/DebugInfo/Msf/IndexedStreamData.h"
30#include "llvm/DebugInfo/Msf/MappedBlockStream.h"
31#include "llvm/DebugInfo/Msf/StreamReader.h"
Rui Ueyama0fcd8262016-05-20 19:55:17 +000032#include "llvm/DebugInfo/PDB/Raw/PDBFile.h"
Rui Ueyama1f6b6e22016-05-13 21:21:53 +000033#include "llvm/DebugInfo/PDB/Raw/RawConstants.h"
34#include "llvm/DebugInfo/PDB/Raw/RawError.h"
Rui Ueyama0fcd8262016-05-20 19:55:17 +000035#include "llvm/DebugInfo/PDB/Raw/SymbolStream.h"
Rui Ueyama1f6b6e22016-05-13 21:21:53 +000036
37#include "llvm/ADT/BitVector.h"
38#include "llvm/Support/Endian.h"
39#include "llvm/Support/Format.h"
40#include "llvm/Support/MathExtras.h"
41
42using namespace llvm;
Zachary Turnerbac69d32016-07-22 19:56:05 +000043using namespace llvm::msf;
Rui Ueyama1f6b6e22016-05-13 21:21:53 +000044using namespace llvm::support;
45using namespace llvm::pdb;
46
47
48static const unsigned IPHR_HASH = 4096;
49
50// This is PSGSIHDR struct defined in
51// https://github.com/Microsoft/microsoft-pdb/blob/master/PDB/dbi/gsi.h
52struct PublicsStream::HeaderInfo {
53 ulittle32_t SymHash;
54 ulittle32_t AddrMap;
55 ulittle32_t NumThunks;
56 ulittle32_t SizeOfThunk;
57 ulittle16_t ISectThunkTable;
58 char Padding[2];
59 ulittle32_t OffThunkTable;
Rui Ueyama8dc18c52016-05-17 23:07:48 +000060 ulittle32_t NumSections;
Rui Ueyama1f6b6e22016-05-13 21:21:53 +000061};
62
Rui Ueyama0fcd8262016-05-20 19:55:17 +000063// This is GSIHashHdr.
Rui Ueyama1f6b6e22016-05-13 21:21:53 +000064struct PublicsStream::GSIHashHeader {
Reid Klecknere1587bc2016-05-19 20:20:22 +000065 enum : unsigned {
66 HdrSignature = ~0U,
Rui Ueyama1f6b6e22016-05-13 21:21:53 +000067 HdrVersion = 0xeffe0000 + 19990810,
68 };
69 ulittle32_t VerSignature;
70 ulittle32_t VerHdr;
71 ulittle32_t HrSize;
72 ulittle32_t NumBuckets;
73};
74
Zachary Turnera1657a92016-06-08 17:26:39 +000075PublicsStream::PublicsStream(PDBFile &File,
76 std::unique_ptr<MappedBlockStream> Stream)
77 : Pdb(File), Stream(std::move(Stream)) {}
Rui Ueyama1f6b6e22016-05-13 21:21:53 +000078
79PublicsStream::~PublicsStream() {}
80
81uint32_t PublicsStream::getSymHash() const { return Header->SymHash; }
82uint32_t PublicsStream::getAddrMap() const { return Header->AddrMap; }
83
84// Publics stream contains fixed-size headers and a serialized hash table.
85// This implementation is not complete yet. It reads till the end of the
86// stream so that we verify the stream is at least not corrupted. However,
87// we skip over the hash table which we believe contains information about
88// public symbols.
89Error PublicsStream::reload() {
Zachary Turnerbac69d32016-07-22 19:56:05 +000090 StreamReader Reader(*Stream);
Rui Ueyama1f6b6e22016-05-13 21:21:53 +000091
92 // Check stream size.
93 if (Reader.bytesRemaining() < sizeof(HeaderInfo) + sizeof(GSIHashHeader))
94 return make_error<RawError>(raw_error_code::corrupt_file,
95 "Publics Stream does not contain a header.");
96
97 // Read PSGSIHDR and GSIHashHdr structs.
Zachary Turner8dbe3622016-05-27 01:54:44 +000098 if (Reader.readObject(Header))
Rui Ueyama1f6b6e22016-05-13 21:21:53 +000099 return make_error<RawError>(raw_error_code::corrupt_file,
100 "Publics Stream does not contain a header.");
Zachary Turner8dbe3622016-05-27 01:54:44 +0000101
102 if (Reader.readObject(HashHdr))
Rui Ueyama1f6b6e22016-05-13 21:21:53 +0000103 return make_error<RawError>(raw_error_code::corrupt_file,
104 "Publics Stream does not contain a header.");
105
Rui Ueyama0fcd8262016-05-20 19:55:17 +0000106 // An array of HashRecord follows. Read them.
Zachary Turnerb393d952016-05-27 03:51:53 +0000107 if (HashHdr->HrSize % sizeof(PSHashRecord))
Rui Ueyama1f6b6e22016-05-13 21:21:53 +0000108 return make_error<RawError>(raw_error_code::corrupt_file,
109 "Invalid HR array size.");
Zachary Turnerb393d952016-05-27 03:51:53 +0000110 uint32_t NumHashRecords = HashHdr->HrSize / sizeof(PSHashRecord);
111 if (auto EC = Reader.readArray(HashRecords, NumHashRecords))
David Majnemer836937e2016-05-27 16:16:56 +0000112 return joinErrors(std::move(EC),
113 make_error<RawError>(raw_error_code::corrupt_file,
114 "Could not read an HR array"));
Rui Ueyama1f6b6e22016-05-13 21:21:53 +0000115
116 // A bitmap of a fixed length follows.
117 size_t BitmapSizeInBits = alignTo(IPHR_HASH + 1, 32);
Zachary Turnerb393d952016-05-27 03:51:53 +0000118 uint32_t NumBitmapEntries = BitmapSizeInBits / 8;
Zachary Turner0d43c1c2016-05-28 05:21:57 +0000119 if (auto EC = Reader.readBytes(Bitmap, NumBitmapEntries))
David Majnemer836937e2016-05-27 16:16:56 +0000120 return joinErrors(std::move(EC),
121 make_error<RawError>(raw_error_code::corrupt_file,
122 "Could not read a bitmap."));
Rui Ueyama1f6b6e22016-05-13 21:21:53 +0000123 for (uint8_t B : Bitmap)
124 NumBuckets += countPopulation(B);
125
Rui Ueyama8dc18c52016-05-17 23:07:48 +0000126 // We don't yet understand the following data structures completely,
127 // but we at least know the types and sizes. Here we are trying
128 // to read the stream till end so that we at least can detect
129 // corrupted streams.
130
131 // Hash buckets follow.
Zachary Turnerb393d952016-05-27 03:51:53 +0000132 if (auto EC = Reader.readArray(HashBuckets, NumBuckets))
David Majnemer836937e2016-05-27 16:16:56 +0000133 return joinErrors(std::move(EC),
134 make_error<RawError>(raw_error_code::corrupt_file,
135 "Hash buckets corrupted."));
Rui Ueyama1f6b6e22016-05-13 21:21:53 +0000136
Rui Ueyama8dc18c52016-05-17 23:07:48 +0000137 // Something called "address map" follows.
Zachary Turnerb393d952016-05-27 03:51:53 +0000138 uint32_t NumAddressMapEntries = Header->AddrMap / sizeof(uint32_t);
139 if (auto EC = Reader.readArray(AddressMap, NumAddressMapEntries))
David Majnemer836937e2016-05-27 16:16:56 +0000140 return joinErrors(std::move(EC),
141 make_error<RawError>(raw_error_code::corrupt_file,
142 "Could not read an address map."));
Rui Ueyama8dc18c52016-05-17 23:07:48 +0000143
144 // Something called "thunk map" follows.
Zachary Turnerb393d952016-05-27 03:51:53 +0000145 if (auto EC = Reader.readArray(ThunkMap, Header->NumThunks))
David Majnemer836937e2016-05-27 16:16:56 +0000146 return joinErrors(std::move(EC),
147 make_error<RawError>(raw_error_code::corrupt_file,
148 "Could not read a thunk map."));
Rui Ueyama8dc18c52016-05-17 23:07:48 +0000149
150 // Something called "section map" follows.
Zachary Turnerb393d952016-05-27 03:51:53 +0000151 if (auto EC = Reader.readArray(SectionOffsets, Header->NumSections))
David Majnemer836937e2016-05-27 16:16:56 +0000152 return joinErrors(std::move(EC),
153 make_error<RawError>(raw_error_code::corrupt_file,
154 "Could not read a section map."));
Rui Ueyama8dc18c52016-05-17 23:07:48 +0000155
156 if (Reader.bytesRemaining() > 0)
157 return make_error<RawError>(raw_error_code::corrupt_file,
158 "Corrupted publics stream.");
Rui Ueyama1f6b6e22016-05-13 21:21:53 +0000159 return Error::success();
160}
Rui Ueyama0fcd8262016-05-20 19:55:17 +0000161
Zachary Turner0d43c1c2016-05-28 05:21:57 +0000162iterator_range<codeview::CVSymbolArray::Iterator>
163PublicsStream::getSymbols(bool *HadError) const {
Rui Ueyama0fcd8262016-05-20 19:55:17 +0000164 auto SymbolS = Pdb.getPDBSymbolStream();
Zachary Turner9e33e6f2016-05-24 18:55:14 +0000165 if (SymbolS.takeError()) {
Zachary Turner0d43c1c2016-05-28 05:21:57 +0000166 codeview::CVSymbolArray::Iterator Iter;
167 return llvm::make_range(Iter, Iter);
Zachary Turner9e33e6f2016-05-24 18:55:14 +0000168 }
Rui Ueyama0fcd8262016-05-20 19:55:17 +0000169 SymbolStream &SS = SymbolS.get();
170
Zachary Turner0d43c1c2016-05-28 05:21:57 +0000171 return SS.getSymbols(HadError);
Rui Ueyama0fcd8262016-05-20 19:55:17 +0000172}
Zachary Turner8848a7a2016-07-06 18:05:57 +0000173
174Error PublicsStream::commit() { return Error::success(); }