//===-- SymbolFileBreakpad.cpp ----------------------------------*- C++ -*-===// // // Part of the LLVM Project, under the Apache License v2.0 with LLVM Exceptions. // See https://llvm.org/LICENSE.txt for license information. // SPDX-License-Identifier: Apache-2.0 WITH LLVM-exception // //===----------------------------------------------------------------------===// #include "Plugins/SymbolFile/Breakpad/SymbolFileBreakpad.h" #include "Plugins/ObjectFile/Breakpad/BreakpadRecords.h" #include "Plugins/ObjectFile/Breakpad/ObjectFileBreakpad.h" #include "lldb/Core/Module.h" #include "lldb/Core/PluginManager.h" #include "lldb/Core/Section.h" #include "lldb/Host/FileSystem.h" #include "lldb/Symbol/CompileUnit.h" #include "lldb/Symbol/ObjectFile.h" #include "lldb/Symbol/PostfixExpression.h" #include "lldb/Symbol/SymbolVendor.h" #include "lldb/Symbol/TypeMap.h" #include "lldb/Utility/Log.h" #include "lldb/Utility/StreamString.h" #include "llvm/ADT/StringExtras.h" using namespace lldb; using namespace lldb_private; using namespace lldb_private::breakpad; class SymbolFileBreakpad::LineIterator { public: // begin iterator for sections of given type LineIterator(ObjectFile &obj, Record::Kind section_type) : m_obj(&obj), m_section_type(toString(section_type)), m_next_section_idx(0), m_next_line(llvm::StringRef::npos) { ++*this; } // An iterator starting at the position given by the bookmark. LineIterator(ObjectFile &obj, Record::Kind section_type, Bookmark bookmark); // end iterator explicit LineIterator(ObjectFile &obj) : m_obj(&obj), m_next_section_idx(m_obj->GetSectionList()->GetNumSections(0)), m_current_line(llvm::StringRef::npos), m_next_line(llvm::StringRef::npos) {} friend bool operator!=(const LineIterator &lhs, const LineIterator &rhs) { assert(lhs.m_obj == rhs.m_obj); if (lhs.m_next_section_idx != rhs.m_next_section_idx) return true; if (lhs.m_current_line != rhs.m_current_line) return true; assert(lhs.m_next_line == rhs.m_next_line); return false; } const LineIterator &operator++(); llvm::StringRef operator*() const { return m_section_text.slice(m_current_line, m_next_line); } Bookmark GetBookmark() const { return Bookmark{m_next_section_idx, m_current_line}; } private: ObjectFile *m_obj; ConstString m_section_type; uint32_t m_next_section_idx; llvm::StringRef m_section_text; size_t m_current_line; size_t m_next_line; void FindNextLine() { m_next_line = m_section_text.find('\n', m_current_line); if (m_next_line != llvm::StringRef::npos) { ++m_next_line; if (m_next_line >= m_section_text.size()) m_next_line = llvm::StringRef::npos; } } }; SymbolFileBreakpad::LineIterator::LineIterator(ObjectFile &obj, Record::Kind section_type, Bookmark bookmark) : m_obj(&obj), m_section_type(toString(section_type)), m_next_section_idx(bookmark.section), m_current_line(bookmark.offset) { Section § = *obj.GetSectionList()->GetSectionAtIndex(m_next_section_idx - 1); assert(sect.GetName() == m_section_type); DataExtractor data; obj.ReadSectionData(§, data); m_section_text = toStringRef(data.GetData()); assert(m_current_line < m_section_text.size()); FindNextLine(); } const SymbolFileBreakpad::LineIterator & SymbolFileBreakpad::LineIterator::operator++() { const SectionList &list = *m_obj->GetSectionList(); size_t num_sections = list.GetNumSections(0); while (m_next_line != llvm::StringRef::npos || m_next_section_idx < num_sections) { if (m_next_line != llvm::StringRef::npos) { m_current_line = m_next_line; FindNextLine(); return *this; } Section § = *list.GetSectionAtIndex(m_next_section_idx++); if (sect.GetName() != m_section_type) continue; DataExtractor data; m_obj->ReadSectionData(§, data); m_section_text = toStringRef(data.GetData()); m_next_line = 0; } // We've reached the end. m_current_line = m_next_line; return *this; } llvm::iterator_range SymbolFileBreakpad::lines(Record::Kind section_type) { return llvm::make_range(LineIterator(*m_obj_file, section_type), LineIterator(*m_obj_file)); } namespace { // A helper class for constructing the list of support files for a given compile // unit. class SupportFileMap { public: // Given a breakpad file ID, return a file ID to be used in the support files // for this compile unit. size_t operator[](size_t file) { return m_map.try_emplace(file, m_map.size() + 1).first->second; } // Construct a FileSpecList containing only the support files relevant for // this compile unit (in the correct order). FileSpecList translate(const FileSpec &cu_spec, llvm::ArrayRef all_files); private: llvm::DenseMap m_map; }; } // namespace FileSpecList SupportFileMap::translate(const FileSpec &cu_spec, llvm::ArrayRef all_files) { std::vector result; result.resize(m_map.size() + 1); result[0] = cu_spec; for (const auto &KV : m_map) { if (KV.first < all_files.size()) result[KV.second] = all_files[KV.first]; } return FileSpecList(std::move(result)); } void SymbolFileBreakpad::Initialize() { PluginManager::RegisterPlugin(GetPluginNameStatic(), GetPluginDescriptionStatic(), CreateInstance, DebuggerInitialize); } void SymbolFileBreakpad::Terminate() { PluginManager::UnregisterPlugin(CreateInstance); } ConstString SymbolFileBreakpad::GetPluginNameStatic() { static ConstString g_name("breakpad"); return g_name; } uint32_t SymbolFileBreakpad::CalculateAbilities() { if (!m_obj_file) return 0; if (m_obj_file->GetPluginName() != ObjectFileBreakpad::GetPluginNameStatic()) return 0; return CompileUnits | Functions | LineTables; } uint32_t SymbolFileBreakpad::GetNumCompileUnits() { ParseCUData(); return m_cu_data->GetSize(); } CompUnitSP SymbolFileBreakpad::ParseCompileUnitAtIndex(uint32_t index) { if (index >= m_cu_data->GetSize()) return nullptr; CompUnitData &data = m_cu_data->GetEntryRef(index).data; ParseFileRecords(); FileSpec spec; // The FileSpec of the compile unit will be the file corresponding to the // first LINE record. LineIterator It(*m_obj_file, Record::Func, data.bookmark), End(*m_obj_file); assert(Record::classify(*It) == Record::Func); ++It; // Skip FUNC record. if (It != End) { auto record = LineRecord::parse(*It); if (record && record->FileNum < m_files->size()) spec = (*m_files)[record->FileNum]; } auto cu_sp = std::make_shared(m_obj_file->GetModule(), /*user_data*/ nullptr, spec, index, eLanguageTypeUnknown, /*is_optimized*/ eLazyBoolNo); GetSymbolVendor().SetCompileUnitAtIndex(index, cu_sp); return cu_sp; } size_t SymbolFileBreakpad::ParseFunctions(CompileUnit &comp_unit) { // TODO return 0; } bool SymbolFileBreakpad::ParseLineTable(CompileUnit &comp_unit) { CompUnitData &data = m_cu_data->GetEntryRef(comp_unit.GetID()).data; if (!data.line_table_up) ParseLineTableAndSupportFiles(comp_unit, data); comp_unit.SetLineTable(data.line_table_up.release()); return true; } bool SymbolFileBreakpad::ParseSupportFiles(CompileUnit &comp_unit, FileSpecList &support_files) { CompUnitData &data = m_cu_data->GetEntryRef(comp_unit.GetID()).data; if (!data.support_files) ParseLineTableAndSupportFiles(comp_unit, data); support_files = std::move(*data.support_files); return true; } uint32_t SymbolFileBreakpad::ResolveSymbolContext(const Address &so_addr, SymbolContextItem resolve_scope, SymbolContext &sc) { if (!(resolve_scope & (eSymbolContextCompUnit | eSymbolContextLineEntry))) return 0; ParseCUData(); uint32_t idx = m_cu_data->FindEntryIndexThatContains(so_addr.GetFileAddress()); if (idx == UINT32_MAX) return 0; sc.comp_unit = GetSymbolVendor().GetCompileUnitAtIndex(idx).get(); SymbolContextItem result = eSymbolContextCompUnit; if (resolve_scope & eSymbolContextLineEntry) { if (sc.comp_unit->GetLineTable()->FindLineEntryByAddress(so_addr, sc.line_entry)) { result |= eSymbolContextLineEntry; } } return result; } uint32_t SymbolFileBreakpad::ResolveSymbolContext( const FileSpec &file_spec, uint32_t line, bool check_inlines, lldb::SymbolContextItem resolve_scope, SymbolContextList &sc_list) { if (!(resolve_scope & eSymbolContextCompUnit)) return 0; uint32_t old_size = sc_list.GetSize(); for (size_t i = 0, size = GetNumCompileUnits(); i < size; ++i) { CompileUnit &cu = *GetSymbolVendor().GetCompileUnitAtIndex(i); cu.ResolveSymbolContext(file_spec, line, check_inlines, /*exact*/ false, resolve_scope, sc_list); } return sc_list.GetSize() - old_size; } uint32_t SymbolFileBreakpad::FindFunctions( ConstString name, const CompilerDeclContext *parent_decl_ctx, FunctionNameType name_type_mask, bool include_inlines, bool append, SymbolContextList &sc_list) { // TODO if (!append) sc_list.Clear(); return sc_list.GetSize(); } uint32_t SymbolFileBreakpad::FindFunctions(const RegularExpression ®ex, bool include_inlines, bool append, SymbolContextList &sc_list) { // TODO if (!append) sc_list.Clear(); return sc_list.GetSize(); } uint32_t SymbolFileBreakpad::FindTypes( ConstString name, const CompilerDeclContext *parent_decl_ctx, bool append, uint32_t max_matches, llvm::DenseSet &searched_symbol_files, TypeMap &types) { if (!append) types.Clear(); return types.GetSize(); } size_t SymbolFileBreakpad::FindTypes(const std::vector &context, bool append, TypeMap &types) { if (!append) types.Clear(); return types.GetSize(); } void SymbolFileBreakpad::AddSymbols(Symtab &symtab) { Log *log = GetLogIfAllCategoriesSet(LIBLLDB_LOG_SYMBOLS); Module &module = *m_obj_file->GetModule(); addr_t base = GetBaseFileAddress(); if (base == LLDB_INVALID_ADDRESS) { LLDB_LOG(log, "Unable to fetch the base address of object file. Skipping " "symtab population."); return; } const SectionList &list = *module.GetSectionList(); llvm::DenseMap symbols; auto add_symbol = [&](addr_t address, llvm::Optional size, llvm::StringRef name) { address += base; SectionSP section_sp = list.FindSectionContainingFileAddress(address); if (!section_sp) { LLDB_LOG(log, "Ignoring symbol {0}, whose address ({1}) is outside of the " "object file. Mismatched symbol file?", name, address); return; } symbols.try_emplace( address, /*symID*/ 0, Mangled(name, /*is_mangled*/ false), eSymbolTypeCode, /*is_global*/ true, /*is_debug*/ false, /*is_trampoline*/ false, /*is_artificial*/ false, AddressRange(section_sp, address - section_sp->GetFileAddress(), size.getValueOr(0)), size.hasValue(), /*contains_linker_annotations*/ false, /*flags*/ 0); }; for (llvm::StringRef line : lines(Record::Func)) { if (auto record = FuncRecord::parse(line)) add_symbol(record->Address, record->Size, record->Name); } for (llvm::StringRef line : lines(Record::Public)) { if (auto record = PublicRecord::parse(line)) add_symbol(record->Address, llvm::None, record->Name); else LLDB_LOG(log, "Failed to parse: {0}. Skipping record.", line); } for (auto &KV : symbols) symtab.AddSymbol(std::move(KV.second)); symtab.CalculateSymbolSizes(); } static llvm::Optional> GetRule(llvm::StringRef &unwind_rules) { // Unwind rules are of the form // register1: expression1 register2: expression2 ... // We assume none of the tokens in expression end with a colon. llvm::StringRef lhs, rest; std::tie(lhs, rest) = getToken(unwind_rules); if (!lhs.consume_back(":")) return llvm::None; // Seek forward to the next register: expression pair llvm::StringRef::size_type pos = rest.find(": "); if (pos == llvm::StringRef::npos) { // No pair found, this means the rest of the string is a single expression. unwind_rules = llvm::StringRef(); return std::make_pair(lhs, rest); } // Go back one token to find the end of the current rule. pos = rest.rfind(' ', pos); if (pos == llvm::StringRef::npos) return llvm::None; llvm::StringRef rhs = rest.take_front(pos); unwind_rules = rest.drop_front(pos); return std::make_pair(lhs, rhs); } static const RegisterInfo * ResolveRegister(const SymbolFile::RegisterInfoResolver &resolver, llvm::StringRef name) { if (name.consume_front("$")) return resolver.ResolveName(name); return nullptr; } static const RegisterInfo * ResolveRegisterOrRA(const SymbolFile::RegisterInfoResolver &resolver, llvm::StringRef name) { if (name == ".ra") return resolver.ResolveNumber(eRegisterKindGeneric, LLDB_REGNUM_GENERIC_PC); return ResolveRegister(resolver, name); } bool SymbolFileBreakpad::ParseUnwindRow(llvm::StringRef unwind_rules, const RegisterInfoResolver &resolver, UnwindPlan::Row &row) { Log *log = GetLogIfAllCategoriesSet(LIBLLDB_LOG_SYMBOLS); llvm::BumpPtrAllocator node_alloc; while (auto rule = GetRule(unwind_rules)) { node_alloc.Reset(); llvm::StringRef lhs = rule->first; postfix::Node *rhs = postfix::Parse(rule->second, node_alloc); if (!rhs) { LLDB_LOG(log, "Could not parse `{0}` as unwind rhs.", rule->second); return false; } bool success = postfix::ResolveSymbols( rhs, [&](postfix::SymbolNode &symbol) -> postfix::Node * { llvm::StringRef name = symbol.GetName(); if (name == ".cfa" && lhs != ".cfa") return postfix::MakeNode(node_alloc); if (const RegisterInfo *info = ResolveRegister(resolver, name)) { return postfix::MakeNode( node_alloc, info->kinds[eRegisterKindLLDB]); } return nullptr; }); if (!success) { LLDB_LOG(log, "Resolving symbols in `{0}` failed.", rule->second); return false; } ArchSpec arch = m_obj_file->GetArchitecture(); StreamString dwarf(Stream::eBinary, arch.GetAddressByteSize(), arch.GetByteOrder()); ToDWARF(*rhs, dwarf); uint8_t *saved = m_allocator.Allocate(dwarf.GetSize()); std::memcpy(saved, dwarf.GetData(), dwarf.GetSize()); if (lhs == ".cfa") { row.GetCFAValue().SetIsDWARFExpression(saved, dwarf.GetSize()); } else if (const RegisterInfo *info = ResolveRegisterOrRA(resolver, lhs)) { UnwindPlan::Row::RegisterLocation loc; loc.SetIsDWARFExpression(saved, dwarf.GetSize()); row.SetRegisterInfo(info->kinds[eRegisterKindLLDB], loc); } else LLDB_LOG(log, "Invalid register `{0}` in unwind rule.", lhs); } if (unwind_rules.empty()) return true; LLDB_LOG(log, "Could not parse `{0}` as an unwind rule.", unwind_rules); return false; } UnwindPlanSP SymbolFileBreakpad::GetUnwindPlan(const Address &address, const RegisterInfoResolver &resolver) { ParseUnwindData(); const UnwindMap::Entry *entry = m_unwind_data->FindEntryThatContains(address.GetFileAddress()); if (!entry) return nullptr; addr_t base = GetBaseFileAddress(); if (base == LLDB_INVALID_ADDRESS) return nullptr; LineIterator It(*m_obj_file, Record::StackCFI, entry->data), End(*m_obj_file); llvm::Optional init_record = StackCFIRecord::parse(*It); assert(init_record.hasValue()); assert(init_record->Size.hasValue()); auto plan_sp = std::make_shared(lldb::eRegisterKindLLDB); plan_sp->SetSourceName("breakpad STACK CFI"); plan_sp->SetUnwindPlanValidAtAllInstructions(eLazyBoolNo); plan_sp->SetSourcedFromCompiler(eLazyBoolYes); plan_sp->SetPlanValidAddressRange( AddressRange(base + init_record->Address, *init_record->Size, m_obj_file->GetModule()->GetSectionList())); auto row_sp = std::make_shared(); row_sp->SetOffset(0); if (!ParseUnwindRow(init_record->UnwindRules, resolver, *row_sp)) return nullptr; plan_sp->AppendRow(row_sp); for (++It; It != End; ++It) { llvm::Optional record = StackCFIRecord::parse(*It); if (!record.hasValue()) return nullptr; if (record->Size.hasValue()) break; row_sp = std::make_shared(*row_sp); row_sp->SetOffset(record->Address - init_record->Address); if (!ParseUnwindRow(record->UnwindRules, resolver, *row_sp)) return nullptr; plan_sp->AppendRow(row_sp); } return plan_sp; } SymbolVendor &SymbolFileBreakpad::GetSymbolVendor() { return *m_obj_file->GetModule()->GetSymbolVendor(); } addr_t SymbolFileBreakpad::GetBaseFileAddress() { return m_obj_file->GetModule() ->GetObjectFile() ->GetBaseAddress() .GetFileAddress(); } // Parse out all the FILE records from the breakpad file. These will be needed // when constructing the support file lists for individual compile units. void SymbolFileBreakpad::ParseFileRecords() { if (m_files) return; m_files.emplace(); Log *log = GetLogIfAllCategoriesSet(LIBLLDB_LOG_SYMBOLS); for (llvm::StringRef line : lines(Record::File)) { auto record = FileRecord::parse(line); if (!record) { LLDB_LOG(log, "Failed to parse: {0}. Skipping record.", line); continue; } if (record->Number >= m_files->size()) m_files->resize(record->Number + 1); FileSpec::Style style = FileSpec::GuessPathStyle(record->Name) .getValueOr(FileSpec::Style::native); (*m_files)[record->Number] = FileSpec(record->Name, style); } } void SymbolFileBreakpad::ParseCUData() { if (m_cu_data) return; m_cu_data.emplace(); Log *log = GetLogIfAllCategoriesSet(LIBLLDB_LOG_SYMBOLS); addr_t base = GetBaseFileAddress(); if (base == LLDB_INVALID_ADDRESS) { LLDB_LOG(log, "SymbolFile parsing failed: Unable to fetch the base address " "of object file."); } // We shall create one compile unit for each FUNC record. So, count the number // of FUNC records, and store them in m_cu_data, together with their ranges. for (LineIterator It(*m_obj_file, Record::Func), End(*m_obj_file); It != End; ++It) { if (auto record = FuncRecord::parse(*It)) { m_cu_data->Append(CompUnitMap::Entry(base + record->Address, record->Size, CompUnitData(It.GetBookmark()))); } else LLDB_LOG(log, "Failed to parse: {0}. Skipping record.", *It); } m_cu_data->Sort(); } // Construct the list of support files and line table entries for the given // compile unit. void SymbolFileBreakpad::ParseLineTableAndSupportFiles(CompileUnit &cu, CompUnitData &data) { addr_t base = GetBaseFileAddress(); assert(base != LLDB_INVALID_ADDRESS && "How did we create compile units without a base address?"); SupportFileMap map; data.line_table_up = llvm::make_unique(&cu); std::unique_ptr line_seq_up( data.line_table_up->CreateLineSequenceContainer()); llvm::Optional next_addr; auto finish_sequence = [&]() { data.line_table_up->AppendLineEntryToSequence( line_seq_up.get(), *next_addr, /*line*/ 0, /*column*/ 0, /*file_idx*/ 0, /*is_start_of_statement*/ false, /*is_start_of_basic_block*/ false, /*is_prologue_end*/ false, /*is_epilogue_begin*/ false, /*is_terminal_entry*/ true); data.line_table_up->InsertSequence(line_seq_up.get()); line_seq_up->Clear(); }; LineIterator It(*m_obj_file, Record::Func, data.bookmark), End(*m_obj_file); assert(Record::classify(*It) == Record::Func); for (++It; It != End; ++It) { auto record = LineRecord::parse(*It); if (!record) break; record->Address += base; if (next_addr && *next_addr != record->Address) { // Discontiguous entries. Finish off the previous sequence and reset. finish_sequence(); } data.line_table_up->AppendLineEntryToSequence( line_seq_up.get(), record->Address, record->LineNum, /*column*/ 0, map[record->FileNum], /*is_start_of_statement*/ true, /*is_start_of_basic_block*/ false, /*is_prologue_end*/ false, /*is_epilogue_begin*/ false, /*is_terminal_entry*/ false); next_addr = record->Address + record->Size; } if (next_addr) finish_sequence(); data.support_files = map.translate(cu, *m_files); } void SymbolFileBreakpad::ParseUnwindData() { if (m_unwind_data) return; m_unwind_data.emplace(); Log *log = GetLogIfAllCategoriesSet(LIBLLDB_LOG_SYMBOLS); addr_t base = GetBaseFileAddress(); if (base == LLDB_INVALID_ADDRESS) { LLDB_LOG(log, "SymbolFile parsing failed: Unable to fetch the base address " "of object file."); } for (LineIterator It(*m_obj_file, Record::StackCFI), End(*m_obj_file); It != End; ++It) { if (auto record = StackCFIRecord::parse(*It)) { if (record->Size) m_unwind_data->Append(UnwindMap::Entry( base + record->Address, *record->Size, It.GetBookmark())); } else LLDB_LOG(log, "Failed to parse: {0}. Skipping record.", *It); } m_unwind_data->Sort(); }