LLVM 22.0.0git
PublicsStream.cpp
Go to the documentation of this file.
1//===- PublicsStream.cpp - PDB Public Symbol Stream -----------------------===//
2//
3// Part of the LLVM Project, under the Apache License v2.0 with LLVM Exceptions.
4// See https://llvm.org/LICENSE.txt for license information.
5// SPDX-License-Identifier: Apache-2.0 WITH LLVM-exception
6//
7//===----------------------------------------------------------------------===//
8//
9// The data structures defined in this file are based on the reference
10// implementation which is available at
11// https://github.com/Microsoft/microsoft-pdb/blob/master/PDB/dbi/gsi.h
12//
13// When reading the reference source code, you may find the
14// information below useful.
15//
16// - ppdb1->m_fMinimalDbgInfo seems to be always true.
17// - SMALLBUCKETS macro is defined.
18//
19// The reference doesn't compile, so this implementation was derived purely
20// from reading the code. It is not guaranteed to be correct.
21//
22//===----------------------------------------------------------------------===//
23
32#include "llvm/Support/Error.h"
33#include <cstdint>
34
35using namespace llvm;
36using namespace llvm::msf;
37using namespace llvm::support;
38using namespace llvm::pdb;
39
// Constructs a PublicsStream over the given MSF block stream. Ownership of
// the stream is moved into the Stream member; nothing is read from the stream
// or validated here.
40PublicsStream::PublicsStream(std::unique_ptr<MappedBlockStream> Stream)
41 : Stream(std::move(Stream)) {}
42
44
// Returns the SymHash field of the publics stream header. Header is
// dereferenced without a null check, so this presumably must only be called
// after the header has been read successfully -- TODO confirm with callers.
45uint32_t PublicsStream::getSymHash() const { return Header->SymHash; }
47 return Header->ISectThunkTable;
48}
50 return Header->OffThunkTable;
51}
52
53// Publics stream contains fixed-size headers and a serialized hash table.
54// This implementation is not complete yet. It reads till the end of the
55// stream so that we verify the stream is at least not corrupted. However,
56// we skip over the hash table which we believe contains information about
57// public symbols.
59 BinaryStreamReader Reader(*Stream);
60
61 // Check stream size.
62 if (Reader.bytesRemaining() <
63 sizeof(PublicsStreamHeader) + sizeof(GSIHashHeader))
65 "Publics Stream does not contain a header.");
66
67 // Read PSGSIHDR struct.
68 if (Reader.readObject(Header))
70 "Publics Stream does not contain a header.");
71
72 // Read the hash table.
73 if (auto E = PublicsTable.read(Reader))
74 return E;
75
76 // Something called "address map" follows.
77 uint32_t NumAddressMapEntries = Header->AddrMap / sizeof(uint32_t);
78 if (auto EC = Reader.readArray(AddressMap, NumAddressMapEntries))
79 return joinErrors(std::move(EC),
81 "Could not read an address map."));
82
83 // Something called "thunk map" follows.
84 if (auto EC = Reader.readArray(ThunkMap, Header->NumThunks))
85 return joinErrors(std::move(EC),
87 "Could not read a thunk map."));
88
89 // Something called "section map" follows.
90 if (Reader.bytesRemaining() > 0) {
91 if (auto EC = Reader.readArray(SectionOffsets, Header->NumSections))
92 return joinErrors(std::move(EC),
94 "Could not read a section map."));
95 }
96
97 if (Reader.bytesRemaining() > 0)
99 "Corrupted publics stream.");
100 return Error::success();
101}
102
103// This is a reimplementation of NearestSym:
104// https://github.com/microsoft/microsoft-pdb/blob/805655a28bd8198004be2ac27e6e0290121a5e89/PDB/dbi/gsi.cpp#L1492-L1581
105std::optional<std::pair<codeview::PublicSym32, size_t>>
107 uint32_t Offset) const {
108 // The address map is sorted by address, so we can use lower_bound to find the
109 // position. Each element is an offset into the symbols for a public symbol.
110 auto It = llvm::lower_bound(
111 AddressMap, std::tuple(Segment, Offset),
112 [&](support::ulittle32_t Cur, auto Addr) {
113 auto Sym = Symbols.readRecord(Cur.value());
114 if (Sym.kind() != codeview::S_PUB32)
115 return false; // stop here, this is most likely corrupted debug info
116
117 auto Psym =
119 Sym);
120 if (!Psym) {
121 consumeError(Psym.takeError());
122 return false;
123 }
124
125 return std::tie(Psym->Segment, Psym->Offset) < Addr;
126 });
127
128 if (It == AddressMap.end())
129 return std::nullopt;
130
131 auto Sym = Symbols.readRecord(It->value());
132 if (Sym.kind() != codeview::S_PUB32)
133 return std::nullopt; // this is most likely corrupted debug info
134
135 auto MaybePsym =
137 if (!MaybePsym) {
138 consumeError(MaybePsym.takeError());
139 return std::nullopt;
140 }
141 codeview::PublicSym32 Psym = std::move(*MaybePsym);
142
143 if (std::tuple(Segment, Offset) != std::tuple(Psym.Segment, Psym.Offset))
144 return std::nullopt;
145
146 std::ptrdiff_t IterOffset = It - AddressMap.begin();
147 return std::pair{Psym, static_cast<size_t>(IterOffset)};
148}
Provides read only access to a subclass of BinaryStream.
Error readObject(const T *&Dest)
Get a pointer to an object of type T from the underlying stream, as if by memcpy, and store the result in Dest.
Error readArray(ArrayRef< T > &Array, uint32_t NumElements)
Get a reference to a NumElements element array of objects of type T from the underlying stream, as if by memcpy, and store the resulting array in Array.
Lightweight error class with error context and mandatory checking.
Definition Error.h:159
static ErrorSuccess success()
Create a success value.
Definition Error.h:336
static Error deserializeAs(CVSymbol Symbol, T &Record)
LLVM_ABI uint32_t getSymHash() const
LLVM_ABI uint32_t getThunkTableOffset() const
LLVM_ABI PublicsStream(std::unique_ptr< msf::MappedBlockStream > Stream)
LLVM_ABI std::optional< std::pair< codeview::PublicSym32, size_t > > findByAddress(const SymbolStream &Symbols, uint16_t Segment, uint32_t Offset) const
Find a public symbol by a segment and offset.
LLVM_ABI uint16_t getThunkTableSection() const
detail::packed_endian_specific_integral< uint32_t, llvm::endianness::little, unaligned > ulittle32_t
Definition Endian.h:286
This is an optimization pass for GlobalISel generic memory operations.
Error joinErrors(Error E1, Error E2)
Concatenate errors.
Definition Error.h:442
Error make_error(ArgTs &&... Args)
Make an Error instance representing failure using the given error info type.
Definition Error.h:340
auto lower_bound(R &&Range, T &&Value)
Provide wrappers to std::lower_bound which take ranges instead of having to pass begin/end explicitly...
Definition STLExtras.h:1974
OutputIt move(R &&Range, OutputIt Out)
Provide wrappers to std::move which take ranges instead of having to pass begin/end explicitly.
Definition STLExtras.h:1847
void consumeError(Error Err)
Consume an Error without doing anything.
Definition Error.h:1083
Implement std::hash so that hash_code can be used in STL containers.
Definition BitVector.h:851
Header of the hash tables found in the globals and publics sections.
Definition RawTypes.h:28