DYT/Tool/breakpad/include/common/windows/pdb_source_line_writer.h
2024-11-22 23:19:31 +08:00

357 lines
14 KiB
C++

// Copyright 2006 Google LLC
//
// Redistribution and use in source and binary forms, with or without
// modification, are permitted provided that the following conditions are
// met:
//
// * Redistributions of source code must retain the above copyright
// notice, this list of conditions and the following disclaimer.
// * Redistributions in binary form must reproduce the above
// copyright notice, this list of conditions and the following disclaimer
// in the documentation and/or other materials provided with the
// distribution.
// * Neither the name of Google LLC nor the names of its
// contributors may be used to endorse or promote products derived from
// this software without specific prior written permission.
//
// THIS SOFTWARE IS PROVIDED BY THE COPYRIGHT HOLDERS AND CONTRIBUTORS
// "AS IS" AND ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT
// LIMITED TO, THE IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR
// A PARTICULAR PURPOSE ARE DISCLAIMED. IN NO EVENT SHALL THE COPYRIGHT
// OWNER OR CONTRIBUTORS BE LIABLE FOR ANY DIRECT, INDIRECT, INCIDENTAL,
// SPECIAL, EXEMPLARY, OR CONSEQUENTIAL DAMAGES (INCLUDING, BUT NOT
// LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS OR SERVICES; LOSS OF USE,
// DATA, OR PROFITS; OR BUSINESS INTERRUPTION) HOWEVER CAUSED AND ON ANY
// THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT LIABILITY, OR TORT
// (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY OUT OF THE USE
// OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE.
// PDBSourceLineWriter uses a pdb file produced by Visual C++ to output
// a line/address map for use with BasicSourceLineResolver.
#ifndef COMMON_WINDOWS_PDB_SOURCE_LINE_WRITER_H_
#define COMMON_WINDOWS_PDB_SOURCE_LINE_WRITER_H_
#include <atlcomcli.h>
#include <map>
#include <memory>
#include <string>
#include <unordered_map>
#include <vector>
#include "common/windows/module_info.h"
#include "common/windows/omap.h"
// Forward declarations of the DIA SDK interfaces that this header only refers
// to through pointers, so that including it does not depend on dia2.h having
// been pulled in first. IDiaLineNumber is used by
// PDBSourceLineWriter::GetLine().
struct IDiaEnumLineNumbers;
struct IDiaLineNumber;
struct IDiaSession;
struct IDiaSymbol;
namespace google_breakpad {
using std::map;
using std::vector;
using std::wstring;
using std::unordered_map;
// PDBSourceLineWriter uses a pdb file produced by Visual C++ to write a
// Breakpad symbol file. Instances are not copyable.
class PDBSourceLineWriter {
 public:
  // The kind of file handed to Open().
  enum FileFormat {
    PDB_FILE,  // a .pdb file containing debug symbols
    EXE_FILE,  // a .exe or .dll file
    ANY_FILE   // try PDB_FILE and then EXE_FILE
  };

  // |handle_inline| presumably selects whether INLINE/INLINE_ORIGIN records
  // are output (see handle_inline_ below).
  explicit PDBSourceLineWriter(bool handle_inline = false);
  ~PDBSourceLineWriter();

  // Copying is disallowed. The operations are deleted so that an accidental
  // copy is rejected at compile time rather than at link time.
  PDBSourceLineWriter(const PDBSourceLineWriter&) = delete;
  PDBSourceLineWriter& operator=(const PDBSourceLineWriter&) = delete;

  // Opens the given file.  For executable files, the corresponding pdb
  // file must be available; Open will fail if it is not.
  // If there is already a pdb file open, it is automatically closed.
  // Returns true on success.
  bool Open(const wstring& file, FileFormat format);

  // Closes the current pdb file and its associated resources.
  void Close();

  // Sets the code file full path.  This is optional for 32-bit modules.  It is
  // also optional for 64-bit modules when there is an executable file stored
  // in the same directory as the PDB file.  It is only required for 64-bit
  // modules when the executable file is not in the same location as the PDB
  // file and it must be called after Open() and before WriteSymbols().
  // If Open() was called for an executable file, then it is an error to call
  // SetCodeFile() with a different file path and it will return false.
  bool SetCodeFile(const wstring& exe_file);

  // Writes a Breakpad symbol file from the current pdb file to |symbol_file|.
  // Returns true on success.
  bool WriteSymbols(FILE* symbol_file);

  // Retrieves information about the module's debugging file.  Returns
  // true on success and false on failure.
  bool GetModuleInfo(PDBModuleInfo* info);

  // Retrieves information about the module's PE file.  Returns
  // true on success and false on failure.
  bool GetPEInfo(PEModuleInfo* info);

  // Sets uses_guid to true if the opened file uses a new-style CodeView
  // record with a 128-bit GUID, or false if the opened file uses an old-style
  // CodeView record.  When no GUID is available, a 32-bit signature should be
  // used to identify the module instead.  If the information cannot be
  // determined, this method returns false.
  bool UsesGUID(bool* uses_guid);

 private:
  // InlineOrigin represents an INLINE_ORIGIN record in a symbol file. It's an
  // inlined function.
  struct InlineOrigin {
    // The unique id for an InlineOrigin.
    int id;
    // The name of the inlined function.
    wstring name;
  };

  // Line represents a LINE record in a symbol file. It represents a source
  // code line.
  struct Line {
    // The relative address of a line.
    DWORD rva;
    // The number of bytes this line covers.
    DWORD length;
    // The source line number.
    DWORD line_num;
    // The id of the source file in which the source line is located.
    DWORD file_id;
  };

  // Inline represents an INLINE record in a symbol file.
  class Inline {
   public:
    explicit Inline(int inline_nest_level);

    void SetOriginId(int origin_id);

    // Adds the inlinee line's range to ranges_. If the line is adjacent to any
    // existing range, that range is extended. Otherwise, the line is added as
    // a new range.
    void ExtendRanges(const Line& line);

    void SetCallSiteLine(DWORD call_site_line);

    void SetCallSiteFileId(DWORD call_site_file_id);

    void SetChildInlines(std::vector<std::unique_ptr<Inline>> child_inlines);

    void Print(FILE* output) const;

   private:
    // The nest level of this inline record.
    int inline_nest_level_;
    // The source line number where this inlined function is called.
    DWORD call_site_line_ = 0;
    // The id of the file where this inlined function is called.
    DWORD call_site_file_id_ = 0;
    // The id used for referring to an InlineOrigin.
    int origin_id_ = 0;
    // A map from rva to length. These are the address ranges covered by this
    // Inline.
    map<DWORD, DWORD> ranges_;
    // The list of direct Inlines inlined inside this Inline.
    vector<std::unique_ptr<Inline>> child_inlines_;
  };

  // Lines represents a map of lines inside a function with rva as the key.
  // AddLine function adds a line into the map and ensures that there is no
  // overlap between any two lines in the map.
  class Lines {
   public:
    const map<DWORD, Line>& GetLineMap() const { return line_map_; }

    // Finds the line from line_map_ that contains the given rva and returns
    // its line_num. If not found, returns 0.
    DWORD GetLineNum(DWORD rva) const;

    // Finds the line from line_map_ that contains the given rva and returns
    // its file_id. If not found, returns 0.
    DWORD GetFileId(DWORD rva) const;

    // Adds the `line` into line_map_. If the `line` overlaps with existing
    // lines, truncates the existing lines and adds the given line. It ensures
    // that all lines in line_map_ do not overlap with each other. For example,
    // suppose there is a line A in the map and we call AddLine with Line B.
    // Line A: rva: 100, length: 20, line_num: 10, file_id: 1
    // Line B: rva: 105, length: 10, line_num: 4, file_id: 2
    // After calling AddLine with Line B, we will have the following lines:
    // Line 1: rva: 100, length: 5, line_num: 10, file_id: 1
    // Line 2: rva: 105, length: 10, line_num: 4, file_id: 2
    // Line 3: rva: 115, length: 5, line_num: 10, file_id: 1
    void AddLine(const Line& line);

   private:
    // Finds the line from line_map_ that contains the given rva. If not found,
    // returns nullptr.
    const Line* GetLine(DWORD rva) const;

    // The key is rva. AddLine function ensures that any two lines in the map
    // do not overlap.
    map<DWORD, Line> line_map_;
  };

  // Constructs a Line from an IDiaLineNumber. The output Line is stored at
  // line. Returns true on success.
  bool GetLine(IDiaLineNumber* dia_line, Line* line) const;

  // Constructs Lines from an IDiaEnumLineNumbers. The resulting lines are
  // stored at line_list.
  // Returns true on success.
  bool GetLines(IDiaEnumLineNumbers* lines, Lines* line_list) const;

  // Outputs the line/address pairs for each line in |lines|.
  void PrintLines(const Lines& lines) const;

  // Outputs a function address and name, followed by its source line list.
  // block can be the same object as function, or it can be a reference to a
  // code block that is lexically part of this function, but resides at a
  // separate address. If has_multiple_symbols is true, this function's
  // instructions correspond to multiple symbols. Returns true on success.
  bool PrintFunction(IDiaSymbol* function, IDiaSymbol* block,
                     bool has_multiple_symbols);

  // Outputs all functions as described above.  Returns true on success.
  bool PrintFunctions();

  // Outputs all of the source files in the session's pdb file.
  // Returns true on success.
  bool PrintSourceFiles();

  // Outputs all inline origins.
  void PrintInlineOrigins() const;

  // Retrieves inlines inside the given block. It also adds inlinee lines to
  // `line_list` since inner lines are more precise source locations. If the
  // block has children with the SymTagInlineSite tag, it will recursively
  // (DFS) call itself with each child as first argument. Returns true on
  // success.
  // `block`: the IDiaSymbol that may have inline sites.
  // `line_list`: the list of lines inside current function.
  // `inline_nest_level`: the nest level of block's Inlines.
  // `inlines`: the vector to store the list of inlines for the block.
  bool GetInlines(IDiaSymbol* block,
                  Lines* line_list,
                  int inline_nest_level,
                  vector<std::unique_ptr<Inline>>* inlines);

  // Outputs all inlines.
  void PrintInlines(const vector<std::unique_ptr<Inline>>& inlines) const;

  // Outputs all of the frame information necessary to construct stack
  // backtraces in the absence of frame pointers. For x86 data stored in
  // .pdb files. Returns true on success.
  bool PrintFrameDataUsingPDB();

  // Outputs all of the frame information necessary to construct stack
  // backtraces in the absence of frame pointers. For x64 data stored in
  // .exe, .dll files. Returns true on success.
  bool PrintFrameDataUsingEXE();

  // Outputs all of the frame information necessary to construct stack
  // backtraces in the absence of frame pointers.  Returns true on success.
  bool PrintFrameData();

  // Outputs a single public symbol address and name, if the symbol corresponds
  // to a code address.  Returns true on success.  If symbol does not
  // correspond to code, returns true without outputting anything. If
  // has_multiple_symbols is true, the symbol corresponds to a code address and
  // the instructions correspond to multiple symbols.
  bool PrintCodePublicSymbol(IDiaSymbol* symbol, bool has_multiple_symbols);

  // Outputs a line identifying the PDB file that is being dumped, along with
  // its uuid and age.
  bool PrintPDBInfo();

  // Outputs a line identifying the PE file corresponding to the PDB
  // file that is being dumped, along with its code identifier,
  // which consists of its timestamp and file size.
  bool PrintPEInfo();

  // Returns true if this filename has already been seen,
  // and an ID is stored for it, or false if it has not.
  bool FileIDIsCached(const wstring& file) const {
    return unique_files_.find(file) != unique_files_.end();
  }

  // Cache this filename and ID for later reuse.
  void CacheFileID(const wstring& file, DWORD id) {
    unique_files_[file] = id;
  }

  // Store this ID in the cache as a duplicate for this filename. Does nothing
  // if the filename has not been cached yet.
  void StoreDuplicateFileID(const wstring& file, DWORD id) {
    const auto cached = unique_files_.find(file);
    if (cached == unique_files_.end())
      return;
    // Map this id to the previously seen one.
    file_ids_[id] = cached->second;
  }

  // Given a file's unique ID, return the ID that should be used to
  // reference it.  There may be multiple files with identical filenames
  // but different unique IDs.  The cache attempts to coalesce these into
  // one ID per unique filename. An ID with no recorded duplicate mapping is
  // returned unchanged.
  DWORD GetRealFileID(DWORD id) const {
    const auto mapped = file_ids_.find(id);
    return mapped == file_ids_.end() ? id : mapped->second;
  }

  // Find the PE file corresponding to the loaded PDB file, and
  // set the code_file_ member.  Returns false on failure.
  bool FindPEFile();

  // Returns the function name for a symbol.  If possible, the name is
  // undecorated.  If the symbol's decorated form indicates the size of
  // parameters on the stack, this information is returned in stack_param_size.
  // Returns true on success.  If the symbol doesn't encode parameter size
  // information, stack_param_size is set to -1.
  static bool GetSymbolFunctionName(IDiaSymbol* function, BSTR* name,
                                    int* stack_param_size);

  // Returns the number of bytes of stack space used for a function's
  // parameters.  function must have the tag SymTagFunction.  In the event of
  // a failure, returns 0, which is also a valid number of bytes.
  static int GetFunctionStackParamSize(IDiaSymbol* function);

  // The filename of the PE file corresponding to the currently-open
  // pdb file.
  wstring code_file_;

  // The session for the currently-open pdb file.
  CComPtr<IDiaSession> session_;

  // The current output file for this WriteSymbols invocation. Defaults to
  // null so the pointer is never indeterminate.
  FILE* output_ = nullptr;

  // There may be many duplicate filenames with different IDs.
  // This maps from the DIA "unique ID" to a single ID per unique
  // filename.
  unordered_map<DWORD, DWORD> file_ids_;

  // This maps unique filenames to file IDs.
  unordered_map<wstring, DWORD> unique_files_;

  // The INLINE_ORIGINS records. The key is the function name.
  std::map<wstring, InlineOrigin> inline_origins_;

  // This is used for calculating post-transform symbol addresses and lengths.
  ImageMap image_map_;

  // If we should output INLINE/INLINE_ORIGIN records. The default matches the
  // constructor's default argument.
  bool handle_inline_ = false;
};
} // namespace google_breakpad
#endif // COMMON_WINDOWS_PDB_SOURCE_LINE_WRITER_H_