-
Notifications
You must be signed in to change notification settings - Fork 3
/
pdb.go
289 lines (267 loc) · 9.52 KB
/
pdb.go
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
103
104
105
106
107
108
109
110
111
112
113
114
115
116
117
118
119
120
121
122
123
124
125
126
127
128
129
130
131
132
133
134
135
136
137
138
139
140
141
142
143
144
145
146
147
148
149
150
151
152
153
154
155
156
157
158
159
160
161
162
163
164
165
166
167
168
169
170
171
172
173
174
175
176
177
178
179
180
181
182
183
184
185
186
187
188
189
190
191
192
193
194
195
196
197
198
199
200
201
202
203
204
205
206
207
208
209
210
211
212
213
214
215
216
217
218
219
220
221
222
223
224
225
226
227
228
229
230
231
232
233
234
235
236
237
238
239
240
241
242
243
244
245
246
247
248
249
250
251
252
253
254
255
256
257
258
259
260
261
262
263
264
265
266
267
268
269
270
271
272
273
274
275
276
277
278
279
280
281
282
283
284
285
286
287
288
289
// Package pdb provides access to the PDB (Microsoft C/C++ program database)
// file format.
//
// ref: https://www.nationalarchives.gov.uk/pronom/fmt/1078
// ref: https://github.com/Microsoft/microsoft-pdb/blob/master/PDB/msf/msf.cpp
// ref: https://llvm.org/docs/PDB/MsfFile.html
// ref: https://llvm.org/docs/PDB/index.html
package pdb
import (
"bytes"
"encoding/binary"
"encoding/hex"
"io"
"io/ioutil"
"log"
"math"
"os"
"github.com/mewkiz/pkg/term"
"github.com/pkg/errors"
)
var (
// dbg is a logger with the "pdb:" prefix which logs debug messages to standard
// error.
dbg = log.New(os.Stderr, term.CyanBold("pdb:")+" ", 0)
// warn is a logger with the "pdb:" prefix which logs warning messages to
// standard error.
warn = log.New(os.Stderr, term.RedBold("pdb:")+" ", 0)
)
// From https://github.com/microsoft/microsoft-pdb
//
// +============+==============================+=====================================================================+
// | Stream no. | Contents | Short Description |
// +============+==============================+=====================================================================+
// | 1 | Pdb (header) | Version information, and information to connect this PDB to the EXE |
// | 2 | Tpi (Type manager) | All the types used in the executable. |
// | 3 | Dbi (Debug information) | Holds section contributions, and list of ‘Mods’ |
// | 4 | NameMap | Holds a hashed string table |
// | 4-(n+4) | n Mod’s (Module information) | Each Mod stream holds symbols and line numbers for one compiland |
// | n+4 | Global symbol hash | An index that allows searching in global symbols by name |
// | n+5 | Public symbol hash | An index that allows searching in public symbols by addresses |
// | n+6 | Symbol records | Actual symbol records of global and public symbols |
// | n+7 | Type hash | Hash used by the TPI stream. |
// +------------+------------------------------+---------------------------------------------------------------------+
// File is a PDB file.
type File struct {
// File header of MSF.
FileHdr *MSFHeader
// Free page map.
FreePageMap *FreePageMap
// Stream table.
StreamTbl *StreamTable
// Streams.
Streams []Stream
// Contents of underlying PDB file.
Data []byte // TODO: rename to buf
}
// ParseFile parses the given PDB file, reading from pdbPath.
func ParseFile(pdbPath string) (*File, error) {
// Read PDB file contents.
buf, err := ioutil.ReadFile(pdbPath)
if err != nil {
return nil, errors.WithStack(err)
}
file := &File{
Data: buf,
}
// Parse MSF file header.
msfHdr, err := parseMSFHeader(bytes.NewReader(file.Data))
if err != nil {
return nil, errors.WithStack(err)
}
file.FileHdr = msfHdr
// Parse free page map.
freePageMapData := file.readPage(int(file.FileHdr.FreePageMapPageNum))
file.FreePageMap = &FreePageMap{
PageBits: freePageMapData,
}
// Parse stream table.
streamTblData := file.readStreamTable()
streamTbl, err := file.parseStreamTable(bytes.NewReader(streamTblData))
if err != nil {
return nil, errors.WithStack(err)
}
file.StreamTbl = streamTbl
// Parse streams.
for streamNum := 0; streamNum < int(file.StreamTbl.NStreams); streamNum++ {
if err := file.parseStream(streamNum); err != nil {
return nil, errors.WithStack(err)
}
}
return file, nil
}
// readPage returns the contents of the given page.
func (file *File) readPage(pageNum int) []byte {
pageSize := int(file.FileHdr.PageSize)
start := pageNum * pageSize
end := start + pageSize
return file.Data[start:end]
}
// MSF signatures.
const (
msfSignature = "Microsoft C/C++ program database 2.00\r\n\x1a\x4a\x47\x00\x00"
// TODO: define signature for MSFBig.
)
// MSFHeader is the header of a multistream file (MSF). The MSF header is always
// at page 0.
//
// ref: https://llvm.org/docs/PDB/MsfFile.html#the-superblock
// ref: MSF_HDR
type MSFHeader struct {
// File format identifier.
Magic [44]byte
// Page size in bytes.
PageSize int32
// Page number of free page map.
FreePageMapPageNum uint16
// Number of pages.
NPages uint16
// Stream information about the stream table.
StreamTblInfo StreamInfo
// Maps from stream page number to page number.
PageNumMap []uint16 // length: math.Ceil(msfHdr.StreamTblInfo.Size / msfHdr.PageSize)
// align until page boundry.
}
// parseMSFHeader parses the given MSF file header, reading from r.
func parseMSFHeader(r io.Reader) (*MSFHeader, error) {
// Magic.
msfHdr := &MSFHeader{}
if err := binary.Read(r, binary.LittleEndian, &msfHdr.Magic); err != nil {
return nil, errors.WithStack(err)
}
magic := string(msfHdr.Magic[:])
if magic != msfSignature {
return nil, errors.Errorf("invalid MSF signature; expected %q, got %q", msfSignature, magic)
}
// PageSize.
if err := binary.Read(r, binary.LittleEndian, &msfHdr.PageSize); err != nil {
return nil, errors.WithStack(err)
}
// FreePageMapPageNum.
if err := binary.Read(r, binary.LittleEndian, &msfHdr.FreePageMapPageNum); err != nil {
return nil, errors.WithStack(err)
}
// NPages.
if err := binary.Read(r, binary.LittleEndian, &msfHdr.NPages); err != nil {
return nil, errors.WithStack(err)
}
// StreamTblInfo.
if err := binary.Read(r, binary.LittleEndian, &msfHdr.StreamTblInfo); err != nil {
return nil, errors.WithStack(err)
}
// PageNumMap.
streamTblNPages := int(math.Ceil(float64(msfHdr.StreamTblInfo.Size) / float64(msfHdr.PageSize))) // number of pages used by stream table.
msfHdr.PageNumMap = make([]uint16, streamTblNPages)
if err := binary.Read(r, binary.LittleEndian, &msfHdr.PageNumMap); err != nil {
return nil, errors.WithStack(err)
}
// TODO: validate alignment until page boundry to be all zero?
return msfHdr, nil
}
// StreamInfo specifies stream information.
//
// ref: SI_PERSIST
type StreamInfo struct {
// Size in bytes of stream table.
Size int32
// ref: SI_PERSIST.mpspnpn
Unknown int32
}
// FreePageMap specifies what pages are used/unused.
//
// ref: https://llvm.org/docs/PDB/MsfFile.html#the-free-block-map
// ref: FPM
type FreePageMap struct {
// Each bit specifies whether the corresponding page is used or unused.
//
// 0 = used
// 1 = unused
PageBits []byte // length: msfHdr.PageSize
}
// IsFree reports whether the given page number is unused.
func (fpm *FreePageMap) IsFree(pageNum int) bool {
i := pageNum / 8
j := pageNum % 8
mask := uint8(1) << j
return fpm.PageBits[i]&mask != 0
}
// readStreamTable reads the contents of the stream table, concatenating its
// pages together.
func (file *File) readStreamTable() []byte {
streamTblNPages := int(math.Ceil(float64(file.FileHdr.StreamTblInfo.Size) / float64(file.FileHdr.PageSize))) // number of pages used by stream table.
var streamTblData []byte
for streamPageNum := 0; streamPageNum < streamTblNPages; streamPageNum++ {
pageNum := int(file.FileHdr.PageNumMap[streamPageNum])
pageData := file.readPage(pageNum)
streamTblData = append(streamTblData, pageData...)
}
return streamTblData[:file.FileHdr.StreamTblInfo.Size]
}
// StreamNumber is a stream index.
type StreamNumber uint16
//go:generate stringer -linecomment -type StreamID
// StreamID specifies a fixed stream index.
type StreamID uint32
// Fixed stream indices (fixed stream number).
//
// ref: https://llvm.org/docs/PDB/index.html#streams
const (
StreamIDPrevStreamTable StreamID = 0 // previous stream table
StreamIDPDBStream StreamID = 1 // PDB stream
StreamIDTPIStream StreamID = 2 // TPI stream
)
// readStreamData reads the contents of the stream with the given stream number,
// concatenating its pages together.
func (file *File) readStreamData(streamNum int) []byte {
streamInfo := file.StreamTbl.StreamInfos[streamNum]
pageNumMap := file.StreamTbl.PageNumMaps[streamNum]
var streamData []byte
for streamPageNum, pageNum := range pageNumMap {
_ = streamPageNum
pageData := file.readPage(int(pageNum))
streamData = append(streamData, pageData...)
}
return streamData[:streamInfo.Size]
}
// Stream is a stream of a PDB file.
//
// Stream is one of the following types.
//
// *PDBStream
// TODO: add more stream types.
type Stream interface{}
// parseStream parses the stream with the given stream number.
//
// ref: https://llvm.org/docs/PDB/index.html#streams
func (file *File) parseStream(streamNum int) error {
dbg.Println("parseStream")
dbg.Println(" streamNum:", streamNum)
streamData := file.readStreamData(streamNum)
dbg.Print(" streamData:\n", hex.Dump(streamData))
switch StreamID(streamNum) {
// Previous stream table (old MSF stream table)
case StreamIDPrevStreamTable:
prevStreamTbl, err := file.parseStreamTable(bytes.NewReader(streamData))
if err != nil {
return errors.WithStack(err)
}
file.Streams = append(file.Streams, prevStreamTbl)
// PDB stream
case StreamIDPDBStream:
pdbStream, err := file.parsePDBStream(bytes.NewReader(streamData))
if err != nil {
return errors.WithStack(err)
}
file.Streams = append(file.Streams, pdbStream)
// TPI stream
case StreamIDTPIStream:
tpiStream, err := file.parseTPIStream(bytes.NewReader(streamData))
if err != nil {
return errors.WithStack(err)
}
file.Streams = append(file.Streams, tpiStream)
default:
warn.Printf("support for stream number %d not yet implemented", streamNum)
}
return nil
}