mirror of
https://github.com/NohamR/Reclass.git
synced 2026-05-10 19:59:21 +00:00
Replace DIA SDK COM-based PDB importer with RawPDB (MolecularMatters) which reads PDB files directly via memory-mapped I/O. Adds File menu "Import PDB..." dialog with type filtering, selection, and progress. - Vendor raw_pdb into third_party/ - Two-phase API: enumeratePdbTypes() + importPdbSelected() - Full recursive import of structs/unions/arrays/pointers/bitfields - PDB import dialog with name filter, select-all, type count - Benchmark: 1654 types from ntkrnlmp.pdb in 16ms - Reorganize import/export files into src/imports/
239 lines
8.9 KiB
C++
239 lines
8.9 KiB
C++
// Copyright 2011-2022, Molecular Matters GmbH <office@molecular-matters.com>
// See LICENSE.txt for licensing details (2-clause BSD License: https://opensource.org/licenses/BSD-2-Clause)

#include "Examples_PCH.h"
|
|
#include "ExampleTimedScope.h"
|
|
#include "PDB_RawFile.h"
|
|
#include "PDB_DBIStream.h"
|
|
|
|
|
|
namespace
{
    // A single symbol gathered by this example: its name and its relative virtual address.
    //
    // we don't have to store std::string in the symbols, since all the data is memory-mapped anyway.
    // we do it in this example to ensure that we don't "cheat" when reading the PDB file. memory-mapped data will only
    // be faulted into the process once it's touched, so actually copying the string data makes us touch the needed data,
    // giving us a real performance measurement.
    //
    // The member order is relied upon by the aggregate initialisation `Symbol { name, rva }` used in this file.
    struct Symbol
    {
        std::string name;   // owned copy of the symbol name
        uint32_t rva;       // address produced by ConvertSectionOffsetToRVA; symbols with an RVA of 0 are never stored
    };
}
|
|
|
|
|
|
void ExampleSymbols(const PDB::RawFile& rawPdbFile, const PDB::DBIStream& dbiStream);
|
|
void ExampleSymbols(const PDB::RawFile& rawPdbFile, const PDB::DBIStream& dbiStream)
|
|
{
|
|
TimedScope total("\nRunning example \"Symbols\"");
|
|
|
|
// in order to keep the example easy to understand, we load the PDB data serially.
|
|
// note that this can be improved a lot by reading streams concurrently.
|
|
|
|
// prepare the image section stream first. it is needed for converting section + offset into an RVA
|
|
TimedScope sectionScope("Reading image section stream");
|
|
const PDB::ImageSectionStream imageSectionStream = dbiStream.CreateImageSectionStream(rawPdbFile);
|
|
sectionScope.Done();
|
|
|
|
|
|
// prepare the module info stream for matching contributions against files
|
|
TimedScope moduleScope("Reading module info stream");
|
|
const PDB::ModuleInfoStream moduleInfoStream = dbiStream.CreateModuleInfoStream(rawPdbFile);
|
|
moduleScope.Done();
|
|
|
|
|
|
// prepare symbol record stream needed by both public and global streams
|
|
TimedScope symbolStreamScope("Reading symbol record stream");
|
|
const PDB::CoalescedMSFStream symbolRecordStream = dbiStream.CreateSymbolRecordStream(rawPdbFile);
|
|
symbolStreamScope.Done();
|
|
|
|
std::vector<Symbol> symbols;
|
|
|
|
// read public symbols
|
|
TimedScope publicScope("Reading public symbol stream");
|
|
const PDB::PublicSymbolStream publicSymbolStream = dbiStream.CreatePublicSymbolStream(rawPdbFile);
|
|
publicScope.Done();
|
|
{
|
|
TimedScope scope("Storing public symbols");
|
|
|
|
const PDB::ArrayView<PDB::HashRecord> hashRecords = publicSymbolStream.GetRecords();
|
|
const size_t count = hashRecords.GetLength();
|
|
|
|
symbols.reserve(count);
|
|
|
|
for (const PDB::HashRecord& hashRecord : hashRecords)
|
|
{
|
|
const PDB::CodeView::DBI::Record* record = publicSymbolStream.GetRecord(symbolRecordStream, hashRecord);
|
|
if (record->header.kind != PDB::CodeView::DBI::SymbolRecordKind::S_PUB32)
|
|
{
|
|
// normally, a PDB only contains S_PUB32 symbols in the public symbol stream, but we have seen PDBs that also store S_CONSTANT as public symbols.
|
|
// ignore these.
|
|
continue;
|
|
}
|
|
|
|
const uint32_t rva = imageSectionStream.ConvertSectionOffsetToRVA(record->data.S_PUB32.section, record->data.S_PUB32.offset);
|
|
if (rva == 0u)
|
|
{
|
|
// certain symbols (e.g. control-flow guard symbols) don't have a valid RVA, ignore those
|
|
continue;
|
|
}
|
|
|
|
symbols.push_back(Symbol { record->data.S_PUB32.name, rva });
|
|
}
|
|
|
|
scope.Done(count);
|
|
}
|
|
|
|
|
|
// read global symbols
|
|
TimedScope globalScope("Reading global symbol stream");
|
|
const PDB::GlobalSymbolStream globalSymbolStream = dbiStream.CreateGlobalSymbolStream(rawPdbFile);
|
|
globalScope.Done();
|
|
{
|
|
TimedScope scope("Storing global symbols");
|
|
|
|
const PDB::ArrayView<PDB::HashRecord> hashRecords = globalSymbolStream.GetRecords();
|
|
const size_t count = hashRecords.GetLength();
|
|
|
|
symbols.reserve(symbols.size() + count);
|
|
|
|
for (const PDB::HashRecord& hashRecord : hashRecords)
|
|
{
|
|
const PDB::CodeView::DBI::Record* record = globalSymbolStream.GetRecord(symbolRecordStream, hashRecord);
|
|
|
|
const char* name = nullptr;
|
|
uint32_t rva = 0u;
|
|
if (record->header.kind == PDB::CodeView::DBI::SymbolRecordKind::S_GDATA32)
|
|
{
|
|
name = record->data.S_GDATA32.name;
|
|
rva = imageSectionStream.ConvertSectionOffsetToRVA(record->data.S_GDATA32.section, record->data.S_GDATA32.offset);
|
|
}
|
|
else if (record->header.kind == PDB::CodeView::DBI::SymbolRecordKind::S_GTHREAD32)
|
|
{
|
|
name = record->data.S_GTHREAD32.name;
|
|
rva = imageSectionStream.ConvertSectionOffsetToRVA(record->data.S_GTHREAD32.section, record->data.S_GTHREAD32.offset);
|
|
}
|
|
else if (record->header.kind == PDB::CodeView::DBI::SymbolRecordKind::S_LDATA32)
|
|
{
|
|
name = record->data.S_LDATA32.name;
|
|
rva = imageSectionStream.ConvertSectionOffsetToRVA(record->data.S_LDATA32.section, record->data.S_LDATA32.offset);
|
|
}
|
|
else if (record->header.kind == PDB::CodeView::DBI::SymbolRecordKind::S_LTHREAD32)
|
|
{
|
|
name = record->data.S_LTHREAD32.name;
|
|
rva = imageSectionStream.ConvertSectionOffsetToRVA(record->data.S_LTHREAD32.section, record->data.S_LTHREAD32.offset);
|
|
}
|
|
else if (record->header.kind == PDB::CodeView::DBI::SymbolRecordKind::S_UDT)
|
|
{
|
|
name = record->data.S_UDT.name;
|
|
}
|
|
else if (record->header.kind == PDB::CodeView::DBI::SymbolRecordKind::S_UDT_ST)
|
|
{
|
|
name = record->data.S_UDT_ST.name;
|
|
}
|
|
|
|
if (rva == 0u)
|
|
{
|
|
// certain symbols (e.g. control-flow guard symbols) don't have a valid RVA, ignore those
|
|
continue;
|
|
}
|
|
|
|
symbols.push_back(Symbol { name, rva });
|
|
}
|
|
|
|
scope.Done(count);
|
|
}
|
|
|
|
|
|
// read module symbols
|
|
{
|
|
TimedScope scope("Storing symbols from modules");
|
|
|
|
const PDB::ArrayView<PDB::ModuleInfoStream::Module> modules = moduleInfoStream.GetModules();
|
|
|
|
for (const PDB::ModuleInfoStream::Module& module : modules)
|
|
{
|
|
if (!module.HasSymbolStream())
|
|
{
|
|
continue;
|
|
}
|
|
|
|
const PDB::ModuleSymbolStream moduleSymbolStream = module.CreateSymbolStream(rawPdbFile);
|
|
moduleSymbolStream.ForEachSymbol([&symbols, &imageSectionStream](const PDB::CodeView::DBI::Record* record)
|
|
{
|
|
const char* name = nullptr;
|
|
uint32_t rva = 0u;
|
|
if (record->header.kind == PDB::CodeView::DBI::SymbolRecordKind::S_THUNK32)
|
|
{
|
|
if (record->data.S_THUNK32.thunk == PDB::CodeView::DBI::ThunkOrdinal::TrampolineIncremental)
|
|
{
|
|
// we have never seen incremental linking thunks stored inside a S_THUNK32 symbol, but better be safe than sorry
|
|
name = "ILT";
|
|
rva = imageSectionStream.ConvertSectionOffsetToRVA(record->data.S_THUNK32.section, record->data.S_THUNK32.offset);
|
|
}
|
|
}
|
|
else if (record->header.kind == PDB::CodeView::DBI::SymbolRecordKind::S_TRAMPOLINE)
|
|
{
|
|
// incremental linking thunks are stored in the linker module
|
|
name = "ILT";
|
|
rva = imageSectionStream.ConvertSectionOffsetToRVA(record->data.S_TRAMPOLINE.thunkSection, record->data.S_TRAMPOLINE.thunkOffset);
|
|
}
|
|
else if (record->header.kind == PDB::CodeView::DBI::SymbolRecordKind::S_BLOCK32)
|
|
{
|
|
// blocks never store a name and are only stored for indicating whether other symbols are children of this block
|
|
}
|
|
else if (record->header.kind == PDB::CodeView::DBI::SymbolRecordKind::S_LABEL32)
|
|
{
|
|
// labels don't have a name
|
|
}
|
|
else if (record->header.kind == PDB::CodeView::DBI::SymbolRecordKind::S_LPROC32)
|
|
{
|
|
name = record->data.S_LPROC32.name;
|
|
rva = imageSectionStream.ConvertSectionOffsetToRVA(record->data.S_LPROC32.section, record->data.S_LPROC32.offset);
|
|
}
|
|
else if (record->header.kind == PDB::CodeView::DBI::SymbolRecordKind::S_GPROC32)
|
|
{
|
|
name = record->data.S_GPROC32.name;
|
|
rva = imageSectionStream.ConvertSectionOffsetToRVA(record->data.S_GPROC32.section, record->data.S_GPROC32.offset);
|
|
}
|
|
else if (record->header.kind == PDB::CodeView::DBI::SymbolRecordKind::S_LPROC32_ID)
|
|
{
|
|
name = record->data.S_LPROC32_ID.name;
|
|
rva = imageSectionStream.ConvertSectionOffsetToRVA(record->data.S_LPROC32_ID.section, record->data.S_LPROC32_ID.offset);
|
|
}
|
|
else if (record->header.kind == PDB::CodeView::DBI::SymbolRecordKind::S_GPROC32_ID)
|
|
{
|
|
name = record->data.S_GPROC32_ID.name;
|
|
rva = imageSectionStream.ConvertSectionOffsetToRVA(record->data.S_GPROC32_ID.section, record->data.S_GPROC32_ID.offset);
|
|
}
|
|
else if (record->header.kind == PDB::CodeView::DBI::SymbolRecordKind::S_REGREL32)
|
|
{
|
|
name = record->data.S_REGREL32.name;
|
|
// You can only get the address while running the program by checking the register value and adding the offset
|
|
}
|
|
else if (record->header.kind == PDB::CodeView::DBI::SymbolRecordKind::S_LDATA32)
|
|
{
|
|
name = record->data.S_LDATA32.name;
|
|
rva = imageSectionStream.ConvertSectionOffsetToRVA(record->data.S_LDATA32.section, record->data.S_LDATA32.offset);
|
|
}
|
|
else if (record->header.kind == PDB::CodeView::DBI::SymbolRecordKind::S_LTHREAD32)
|
|
{
|
|
name = record->data.S_LTHREAD32.name;
|
|
rva = imageSectionStream.ConvertSectionOffsetToRVA(record->data.S_LTHREAD32.section, record->data.S_LTHREAD32.offset);
|
|
}
|
|
|
|
if (rva == 0u)
|
|
{
|
|
// certain symbols (e.g. control-flow guard symbols) don't have a valid RVA, ignore those
|
|
return;
|
|
}
|
|
|
|
symbols.push_back(Symbol { name, rva });
|
|
});
|
|
}
|
|
|
|
scope.Done(modules.GetLength());
|
|
}
|
|
|
|
total.Done(symbols.size());
|
|
}
|