summaryrefslogtreecommitdiffstats
path: root/breakpad
diff options
context:
space:
mode:
authorthestig@chromium.org <thestig@chromium.org@0039d316-1c4b-4281-b951-d872f2087c98>2009-05-27 22:10:12 +0000
committerthestig@chromium.org <thestig@chromium.org@0039d316-1c4b-4281-b951-d872f2087c98>2009-05-27 22:10:12 +0000
commite7b755275ea9426d0943b06c66cb861a3a0ca85f (patch)
tree559499db472bd04157d66d83c9ce6f035ae88969 /breakpad
parentc5e1c7a2d5e7c0bd8db8d7fc44dabea13a4a9721 (diff)
downloadchromium_src-e7b755275ea9426d0943b06c66cb861a3a0ca85f.zip
chromium_src-e7b755275ea9426d0943b06c66cb861a3a0ca85f.tar.gz
chromium_src-e7b755275ea9426d0943b06c66cb861a3a0ca85f.tar.bz2
Fork breakpad's dump_syms and related code. Generate XOR of first page of memory instead of MD5 of text section.
BUG=none TEST=none Review URL: http://codereview.chromium.org/113893 git-svn-id: svn://svn.chromium.org/chrome/trunk/src@17031 0039d316-1c4b-4281-b951-d872f2087c98
Diffstat (limited to 'breakpad')
-rw-r--r--breakpad/breakpad.gyp11
-rw-r--r--breakpad/linux/dump_symbols.cc779
-rw-r--r--breakpad/linux/dump_symbols.h47
-rw-r--r--breakpad/linux/dump_syms.cc50
-rw-r--r--breakpad/linux/file_id.cc103
-rw-r--r--breakpad/linux/file_id.h70
6 files changed, 1055 insertions, 5 deletions
diff --git a/breakpad/breakpad.gyp b/breakpad/breakpad.gyp
index a04c2f4..2119204 100644
--- a/breakpad/breakpad.gyp
+++ b/breakpad/breakpad.gyp
@@ -294,7 +294,6 @@
# 'src/tools/linux/symupload/sym_upload.cc',
# 'src/common/linux/http_upload.cc',
# ],
-#
# 'include_dirs': [
# 'src',
# ],
@@ -309,14 +308,16 @@
# 'type': 'executable',
#
# 'sources': [
-# 'src/tools/linux/dump_syms/dump_syms.cc',
-# 'src/common/linux/dump_symbols.cc',
-# 'src/common/linux/file_id.cc',
-# 'src/common/md5.c',
+# 'linux/dump_syms.cc',
+# 'linux/dump_symbols.cc',
+# 'linux/dump_symbols.h',
+# 'linux/file_id.cc',
+# 'linux/file_id.h',
# ],
#
# 'include_dirs': [
# 'src',
+# '..',
# ],
# },
],
diff --git a/breakpad/linux/dump_symbols.cc b/breakpad/linux/dump_symbols.cc
new file mode 100644
index 0000000..2ad4bff
--- /dev/null
+++ b/breakpad/linux/dump_symbols.cc
@@ -0,0 +1,779 @@
+// Copyright (c) 2006, 2009, Google Inc.
+// All rights reserved.
+//
+// Redistribution and use in source and binary forms, with or without
+// modification, are permitted provided that the following conditions are
+// met:
+//
+// * Redistributions of source code must retain the above copyright
+// notice, this list of conditions and the following disclaimer.
+// * Redistributions in binary form must reproduce the above
+// copyright notice, this list of conditions and the following disclaimer
+// in the documentation and/or other materials provided with the
+// distribution.
+// * Neither the name of Google Inc. nor the names of its
+// contributors may be used to endorse or promote products derived from
+// this software without specific prior written permission.
+//
+// THIS SOFTWARE IS PROVIDED BY THE COPYRIGHT HOLDERS AND CONTRIBUTORS
+// "AS IS" AND ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT
+// LIMITED TO, THE IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR
+// A PARTICULAR PURPOSE ARE DISCLAIMED. IN NO EVENT SHALL THE COPYRIGHT
+// OWNER OR CONTRIBUTORS BE LIABLE FOR ANY DIRECT, INDIRECT, INCIDENTAL,
+// SPECIAL, EXEMPLARY, OR CONSEQUENTIAL DAMAGES (INCLUDING, BUT NOT
+// LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS OR SERVICES; LOSS OF USE,
+// DATA, OR PROFITS; OR BUSINESS INTERRUPTION) HOWEVER CAUSED AND ON ANY
+// THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT LIABILITY, OR TORT
+// (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY OUT OF THE USE
+// OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE.
+
+#include "breakpad/linux/dump_symbols.h"
+
+#include <a.out.h>
+#include <assert.h>
+#include <cxxabi.h>
+#include <elf.h>
+#include <errno.h>
+#include <fcntl.h>
+#include <link.h>
+#include <stab.h>
+#include <string.h>
+#include <sys/mman.h>
+#include <sys/stat.h>
+#include <sys/types.h>
+#include <unistd.h>
+
+#include <algorithm>
+#include <cstdarg>
+#include <cstdio>
+#include <cstdlib>
+#include <functional>
+#include <list>
+#include <vector>
+
+#include "breakpad/linux/file_id.h"
+#include "common/linux/guid_creator.h"
+
+// This namespace contains helper functions.
+namespace {
+
+// Information about one source line (one N_SLINE stab entry).
+struct LineInfo {
+ // Index into the stab string table of the name of the source file
+ // this line belongs to.
+ // Taken from the stab symbols (n_strx of the governing N_SO or N_SOL).
+ uint32_t source_name_index;
+ // Offset from the start of the enclosing function.
+ // Taken from the stab symbol (n_value of the N_SLINE entry).
+ ElfW(Off) rva_to_func;
+ // Offset from the base of the loaded binary.
+ ElfW(Off) rva_to_base;
+ // Size of the line.
+ // It is the difference between the starting address of this line and the
+ // starting address of the next N_SLINE, N_FUN or N_SO.
+ uint32_t size;
+ // Line number (n_desc of the N_SLINE entry).
+ uint32_t line_num;
+ // Id of the source file for this line; -1 until AddIncludedFiles sets it.
+ int source_id;
+};
+
+typedef std::list<struct LineInfo> LineInfoList;
+
+// Information about one function (one N_FUN stab entry).
+struct FuncInfo {
+ // Name of the function; points into the mapped stab string table.
+ const char* name;
+ // Offset of the function from the loading address of the binary.
+ ElfW(Off) rva_to_base;
+ // Virtual address of the function.
+ // Taken from the stab symbol (n_value of the N_FUN entry).
+ ElfW(Addr) addr;
+ // Size of the function.
+ // It is the difference between the starting address of the function and
+ // the starting address of the next N_FUN or N_SO.
+ uint32_t size;
+ // Total size of stack parameters (currently always stored as 0).
+ uint32_t stack_param_size;
+ // True when an N_SOL entry was seen, i.e. lines come from other files.
+ bool has_sol;
+ // Line records belonging to this function.
+ LineInfoList line_info;
+};
+
+typedef std::list<struct FuncInfo> FuncInfoList;
+
+// Information about one source file (an N_SO entry or an included file).
+struct SourceFileInfo {
+ // Index of the file name in the stab string table.
+ uint32_t name_index;
+ // Name of the source file; points into the mapped stab string table.
+ const char* name;
+ // Starting address of the source file (0 for included files).
+ ElfW(Addr) addr;
+ // Id of the source file; -1 when the file gets no FILE record.
+ int source_id;
+ // Functions found in this source file.
+ FuncInfoList func_info;
+};
+
+typedef std::list<struct SourceFileInfo> SourceFileInfoList;
+
+// Everything loaded from one symbol table.
+// This is the root that owns all source file, function and line records.
+struct SymbolInfo {
+ SourceFileInfoList source_file_info;
+
+ // The id to hand out to the next newly found source file.
+ int next_source_id;
+};
+
+// Name of the ELF section that holds the stab symbol entries.
+static const char* kStabName = ".stab";
+
+// Returns the demangled form of |mangled| as produced by the C++ ABI
+// demangler, or a copy of |mangled| itself when demangling fails.
+// Older GCC versions may not provide the ABI call.
+static std::string Demangle(const char* mangled) {
+  int status = 0;
+  char* demangled = abi::__cxa_demangle(mangled, NULL, NULL, &status);
+  if (status != 0 || demangled == NULL)
+    return std::string(mangled);
+
+  // The demangler hands back a malloc()ed buffer that we must release.
+  std::string result(demangled);
+  free(demangled);
+  return result;
+}
+
+// Turns the file offsets stored in the ELF header and section headers into
+// addresses inside the mapping by adding the mapped base to each of them.
+// This makes it possible to reach data by simply casting the "offset" fields.
+// |obj_base| must point to a writable mapping of the whole ELF file.
+static void FixAddress(void* obj_base) {
+  // ElfW(Addr) is as wide as a native pointer, whereas ElfW(Word) is always
+  // 32 bits and would truncate (or fail to compile for) 64-bit pointers.
+  ElfW(Addr) base = reinterpret_cast<ElfW(Addr)>(obj_base);
+  ElfW(Ehdr)* elf_header = static_cast<ElfW(Ehdr)*>(obj_base);
+  elf_header->e_phoff += base;
+  elf_header->e_shoff += base;
+  // e_shoff now holds the address of the section header table.
+  ElfW(Shdr)* sections = reinterpret_cast<ElfW(Shdr)*>(elf_header->e_shoff);
+  for (int i = 0; i < elf_header->e_shnum; ++i)
+    sections[i].sh_offset += base;
+}
+
+// Returns the preferred loading address of the binary: the virtual address of
+// the first PT_LOAD program header whose file offset is zero. Returns 0 when
+// no such header exists (other kinds of ELF files).
+static ElfW(Addr) GetLoadingAddress(const ElfW(Phdr)* program_headers,
+                                    int nheader) {
+  int index = 0;
+  while (index < nheader) {
+    const ElfW(Phdr)* candidate = program_headers + index;
+    if (candidate->p_type == PT_LOAD && candidate->p_offset == 0)
+      return candidate->p_vaddr;
+    ++index;
+  }
+  return 0;
+}
+
+// Formats a printf-style message and writes all of it to |fd|.
+// Returns true only when the complete formatted text has been written.
+// Output longer than the stack buffer is formatted again into a heap buffer
+// instead of being silently truncated; short writes and EINTR are retried.
+static bool WriteFormat(int fd, const char* fmt, ...) {
+  char stack_buffer[4096];
+  va_list list;
+  va_start(list, fmt);
+  int needed = vsnprintf(stack_buffer, sizeof(stack_buffer), fmt, list);
+  va_end(list);
+  if (needed < 0)
+    return false;
+
+  const char* data = stack_buffer;
+  std::vector<char> heap_buffer;
+  if (static_cast<size_t>(needed) >= sizeof(stack_buffer)) {
+    // vsnprintf reported the length it wanted; format again with enough room.
+    heap_buffer.resize(static_cast<size_t>(needed) + 1);
+    va_start(list, fmt);
+    int second = vsnprintf(&heap_buffer[0], heap_buffer.size(), fmt, list);
+    va_end(list);
+    if (second != needed)
+      return false;
+    data = &heap_buffer[0];
+  }
+
+  size_t remaining = static_cast<size_t>(needed);
+  while (remaining > 0) {
+    ssize_t written = write(fd, data, remaining);
+    if (written < 0) {
+      if (errno == EINTR)
+        continue;
+      return false;
+    }
+    if (written == 0)
+      return false;
+    data += written;
+    remaining -= static_cast<size_t>(written);
+  }
+  return true;
+}
+
+// Returns true when the header starts with the ELF magic bytes.
+static bool IsValidElf(const ElfW(Ehdr)* elf_header) {
+  // e_ident is the first member, so this inspects the first SELFMAG bytes.
+  const unsigned char* ident = elf_header->e_ident;
+  const int difference = memcmp(ident, ELFMAG, SELFMAG);
+  return difference == 0;
+}
+
+// Returns the first of the |nsection| section headers in |sections| whose
+// name is exactly |name|, or NULL when there is none or |name| is empty.
+// |strtab| is the section-name string table; its sh_offset (and the headers')
+// must already have been turned into addresses by FixAddress.
+// The comparison is exact: a prefix comparison would let ".stab" match
+// ".stabstr" whenever that section happens to come first.
+static const ElfW(Shdr)* FindSectionByName(const char* name,
+                                           const ElfW(Shdr)* sections,
+                                           const ElfW(Shdr)* strtab,
+                                           int nsection) {
+  assert(name != NULL);
+  assert(sections != NULL);
+  assert(nsection > 0);
+
+  if (name[0] == '\0')
+    return NULL;
+
+  for (int i = 0; i < nsection; ++i) {
+    const char* section_name =
+        reinterpret_cast<char*>(strtab->sh_offset + sections[i].sh_name);
+    if (strcmp(name, section_name) == 0)
+      return sections + i;
+  }
+  return NULL;
+}
+
+// TODO(liuli): Compute the stack parameter size.
+// Parameter symbols (N_PSYM) are expected to follow the N_FUN symbol
+// immediately; computing a real size would need the type information parsed.
+// For now the size is recorded as 0. Returns the number of entries consumed:
+// the N_FUN entry plus the N_PSYM entries directly after it.
+static int LoadStackParamSize(struct nlist* list,
+                              struct nlist* list_end,
+                              struct FuncInfo* func_info) {
+  assert(list->n_type == N_FUN);
+  int consumed = 1;
+  for (struct nlist* param = list + 1;
+       param < list_end && param->n_type == N_PSYM;
+       ++param) {
+    ++consumed;
+  }
+  func_info->stack_param_size = 0;
+  return consumed;
+}
+
+// Collects the N_SLINE entries of one function into |func_info->line_info|.
+// Scanning starts at |list| and stops at the next N_FUN or N_SO entry, or at
+// |list_end|. Returns the number of stab entries consumed.
+static int LoadLineInfo(struct nlist* list,
+                        struct nlist* list_end,
+                        const struct SourceFileInfo& source_file_info,
+                        struct FuncInfo* func_info) {
+  struct nlist* cur_list = list;
+  func_info->has_sol = false;
+  // Records which source file the following lines belong to. Defaults to the
+  // file being handled; an N_SOL entry switches it to the file named there,
+  // which is how inlined/included source is attributed.
+  int current_source_name_index = source_file_info.name_index;
+  // The loop must be bounded by the moving cursor. Testing the fixed start
+  // pointer would spin forever once the end of the table is reached without
+  // a terminating N_FUN or N_SO entry.
+  while (cur_list < list_end) {
+    // Skip entries that carry no line information.
+    while (cur_list < list_end && cur_list->n_type != N_SLINE) {
+      // Another function or source file ends this function's lines.
+      if (cur_list->n_type == N_FUN || cur_list->n_type == N_SO)
+        return cur_list - list;
+      // N_SOL means the source lines following it come from another file.
+      if (cur_list->n_type == N_SOL) {
+        func_info->has_sol = true;
+
+        if (cur_list->n_un.n_strx > 0 &&
+            cur_list->n_un.n_strx != current_source_name_index) {
+          // The following lines will be from this source file.
+          current_source_name_index = cur_list->n_un.n_strx;
+        }
+      }
+      ++cur_list;
+    }
+    while (cur_list < list_end && cur_list->n_type == N_SLINE) {
+      struct LineInfo line;
+      line.source_name_index = current_source_name_index;
+      line.rva_to_func = cur_list->n_value;
+      // Filled in by a later pass; zeroed so no indeterminate value is copied.
+      line.rva_to_base = 0;
+      line.size = 0;
+      // n_desc is a signed short.
+      line.line_num = static_cast<unsigned short>(cur_list->n_desc);
+      // Resolved in a later pass.
+      line.source_id = -1;
+      func_info->line_info.push_back(line);
+      ++cur_list;
+    }
+  }
+
+  return cur_list - list;
+}
+
+// Loads every function of the compilation unit that starts at the N_SO entry
+// |list| into |source_file_info->func_info|. Scanning stops at the next N_SO
+// entry or at |list_end|. Returns the number of stab entries consumed.
+static int LoadFuncSymbols(struct nlist* list,
+                           struct nlist* list_end,
+                           const ElfW(Shdr)* stabstr_section,
+                           struct SourceFileInfo* source_file_info) {
+  struct nlist* cur_list = list;
+  assert(cur_list->n_type == N_SO);
+  ++cur_list;
+  source_file_info->func_info.clear();
+  while (cur_list < list_end) {
+    // Advance to the next function symbol; a new N_SO ends this unit.
+    while (cur_list < list_end && cur_list->n_type != N_FUN) {
+      if (cur_list->n_type == N_SO)
+        return cur_list - list;
+      ++cur_list;
+    }
+    // The table ended without another function: never read past the end.
+    if (cur_list >= list_end)
+      break;
+
+    struct FuncInfo func_info;
+    // sh_offset was turned into an address, so this is the name string.
+    func_info.name =
+        reinterpret_cast<char*>(cur_list->n_un.n_strx +
+                                stabstr_section->sh_offset);
+    func_info.addr = cur_list->n_value;
+    func_info.rva_to_base = 0;
+    func_info.size = 0;
+    func_info.stack_param_size = 0;
+    func_info.has_sol = false;
+
+    // Stack parameter size.
+    cur_list += LoadStackParamSize(cur_list, list_end, &func_info);
+    // Line info.
+    cur_list += LoadLineInfo(cur_list,
+                             list_end,
+                             *source_file_info,
+                             &func_info);
+
+    // Functions in this module should have an address no smaller than the
+    // module starting address. A function may have many duplicated entries
+    // in the symbol table; only one of them can meet this.
+    if (func_info.addr >= source_file_info->addr)
+      source_file_info->func_info.push_back(func_info);
+  }
+  return cur_list - list;
+}
+
+// Orders two records by address.
+// Both argument types must have a member named "addr".
+template<class T1, class T2>
+static bool CompareAddress(T1* lhs, T2* rhs) {
+  const bool lhs_is_lower = lhs->addr < rhs->addr;
+  return lhs_is_lower;
+}
+
+// Builds a vector of pointers to the elements of |container|, sorted by
+// increasing virtual address. The vector only refers to the elements, so the
+// container (and its elements) must stay alive for as long as the returned
+// vector is used.
+template<class Container>
+static std::vector<typename Container::value_type* > SortByAddress(
+    Container* container) {
+  typedef typename Container::value_type Element;
+  typedef typename Container::iterator Iterator;
+
+  std::vector<Element*> by_address;
+  by_address.reserve(container->size());
+  const Iterator last = container->end();
+  for (Iterator current = container->begin(); current != last; ++current) {
+    Element& element = *current;
+    by_address.push_back(&element);
+  }
+
+  std::sort(by_address.begin(),
+            by_address.end(),
+            &CompareAddress<Element, Element>);
+  return by_address;
+}
+
+// Returns the address of the first function in |sorted_functions| that lies
+// above |func_info|; failing that, the address of the first source file in
+// |sorted_files| that lies above it. Returns 0 when neither exists.
+// Both vectors are scanned front to back, so they should be address-sorted.
+static ElfW(Addr) NextAddress(
+    std::vector<struct FuncInfo* >* sorted_functions,
+    std::vector<struct SourceFileInfo* >* sorted_files,
+    const struct FuncInfo& func_info) {
+  const ElfW(Addr) current = func_info.addr;
+
+  for (size_t i = 0; i < sorted_functions->size(); ++i) {
+    const struct FuncInfo* candidate = (*sorted_functions)[i];
+    if (current < candidate->addr)
+      return candidate->addr;
+  }
+
+  for (size_t i = 0; i < sorted_files->size(); ++i) {
+    const struct SourceFileInfo* candidate = (*sorted_files)[i];
+    if (current < candidate->addr)
+      return candidate->addr;
+  }
+
+  return 0;
+}
+
+// Returns the source id of the first file in |files| whose name index equals
+// |name_index|, or -1 when no file matches.
+static int FindFileByNameIdx(uint32_t name_index,
+                             SourceFileInfoList& files) {
+  SourceFileInfoList::iterator file = files.begin();
+  while (file != files.end()) {
+    if (file->name_index == name_index)
+      return file->source_id;
+    ++file;
+  }
+  return -1;
+}
+
+// Assigns a source id to every line record and registers the included files
+// (typically headers) that contribute lines but have no N_SO entry of their
+// own. Newly registered files are appended to |symbols->source_file_info|.
+static void AddIncludedFiles(struct SymbolInfo* symbols,
+                             const ElfW(Shdr)* stabstr_section) {
+  SourceFileInfoList& all_files = symbols->source_file_info;
+  // Appending to a std::list keeps iterators valid, so files added below are
+  // visited by this same loop later on (they have no functions).
+  for (SourceFileInfoList::iterator file_it = all_files.begin();
+       file_it != all_files.end(); ++file_it) {
+    struct SourceFileInfo& owner = *file_it;
+
+    for (FuncInfoList::iterator func_it = owner.func_info.begin();
+         func_it != owner.func_info.end(); ++func_it) {
+      LineInfoList& lines = func_it->line_info;
+
+      for (LineInfoList::iterator line_it = lines.begin();
+           line_it != lines.end(); ++line_it) {
+        struct LineInfo& line = *line_it;
+
+        assert(line.source_name_index > 0);
+        assert(owner.name_index > 0);
+
+        // Same string-table index: the line belongs to the owning file.
+        if (line.source_name_index == owner.name_index) {
+          line.source_id = owner.source_id;
+          continue;
+        }
+
+        // The line comes from another file; reuse its id if already known.
+        const int known_id =
+            FindFileByNameIdx(line.source_name_index, all_files);
+        if (known_id >= 0) {
+          line.source_id = known_id;
+          continue;
+        }
+
+        // A new included file. Such files carry no address or functions.
+        SourceFileInfo included;
+        included.name_index = line.source_name_index;
+        included.name =
+            reinterpret_cast<char*>(included.name_index +
+                                    stabstr_section->sh_offset);
+        included.addr = 0;
+        included.source_id = symbols->next_source_id++;
+        line.source_id = included.source_id;
+        all_files.push_back(included);
+      }  // for each line.
+    }  // for each function.
+  }  // for each source file.
+}
+
+// Fills in the size and the offset-from-base of every function and line,
+// using the addresses loaded from the stab section. Always returns true.
+static bool ComputeSizeAndRVA(ElfW(Addr) loading_addr,
+                              struct SymbolInfo* symbols) {
+  // Some functions have an address above every other function and source
+  // file, most likely because they are the last function of the module. The
+  // stab symbols cannot tell how large such a function is, so it is given a
+  // very large default size. That should be safe for the last function, but
+  // it is an ugly hack. Code like this reproduces the case:
+  //   template<class T>
+  //   void Foo(T value) {
+  //   }
+  //
+  //   int main(void) {
+  //     Foo(10);
+  //     Foo(std::string("hello"));
+  //     return 0;
+  //   }
+  // TODO(liuli): Find a better solution.
+  static const int kDefaultSize = 0x10000000;
+  // Counts the functions that had no following symbol, across all calls.
+  static int no_next_addr_count = 0;
+
+  std::vector<struct SourceFileInfo* > files_by_addr =
+      SortByAddress(&(symbols->source_file_info));
+  for (size_t file_idx = 0; file_idx < files_by_addr.size(); ++file_idx) {
+    std::vector<struct FuncInfo* > funcs_by_addr =
+        SortByAddress(&(files_by_addr[file_idx]->func_info));
+    for (size_t func_idx = 0; func_idx < funcs_by_addr.size(); ++func_idx) {
+      struct FuncInfo& func = *funcs_by_addr[func_idx];
+      assert(func.addr >= loading_addr);
+      func.rva_to_base = func.addr - loading_addr;
+      func.size = 0;
+
+      const ElfW(Addr) next_addr =
+          NextAddress(&funcs_by_addr, &files_by_addr, func);
+      const bool has_next = (next_addr != 0);
+      if (has_next) {
+        func.size = next_addr - func.addr;
+      } else if (no_next_addr_count > 1) {
+        fprintf(stderr, "Got more than one function without the following ");
+        fprintf(stderr, "symbol. Ignore this function.\n");
+        fprintf(stderr, "The dumped symbol may not correct.\n");
+        assert(!"This should not happen!\n");
+        func.size = 0;
+        continue;
+      } else {
+        no_next_addr_count++;
+        func.size = kDefaultSize;
+      }
+
+      // Compute the size of each line.
+      LineInfoList& lines = func.line_info;
+      LineInfoList::iterator current = lines.begin();
+      while (current != lines.end()) {
+        LineInfoList::iterator following = current;
+        ++following;
+
+        current->size = 0;
+        if (following != lines.end()) {
+          current->size = following->rva_to_func - current->rva_to_func;
+        } else if (has_next) {
+          // Last line of the function: it runs up to the next function or
+          // source file symbol.
+          ElfW(Off) next_addr_offset = next_addr - func.addr;
+          current->size = next_addr_offset - current->rva_to_func;
+        } else {
+          // Last line of a function with no following symbol, which mostly
+          // means the last function of the module: use the big default.
+          current->size = kDefaultSize;
+        }
+        current->rva_to_base = current->rva_to_func + func.rva_to_base;
+
+        current = following;
+      }  // for each line.
+    }  // for each function.
+  }  // for each source file.
+  return true;
+}
+
+// Loads all symbols from the stab section into |symbols| in three passes:
+// read the raw entries, compute sizes and offsets, then attribute lines to
+// included files. Returns false when either section is missing or the size
+// computation fails.
+static bool LoadSymbols(const ElfW(Shdr)* stab_section,
+                        const ElfW(Shdr)* stabstr_section,
+                        ElfW(Addr) loading_addr,
+                        struct SymbolInfo* symbols) {
+  if (stab_section == NULL || stabstr_section == NULL)
+    return false;
+
+  struct nlist* lists =
+      reinterpret_cast<struct nlist*>(stab_section->sh_offset);
+  int nstab = stab_section->sh_size / sizeof(struct nlist);
+
+  // First pass, load all symbols from the object file.
+  int index = 0;
+  while (index < nstab) {
+    struct nlist* entry = lists + index;
+    if (entry->n_type != N_SO) {
+      ++index;
+      continue;
+    }
+
+    // An N_SO entry starts a new source file (compilation unit).
+    struct SourceFileInfo unit;
+    unit.name_index = entry->n_un.n_strx;
+    unit.name = reinterpret_cast<char*>(entry->n_un.n_strx +
+                                        stabstr_section->sh_offset);
+    unit.addr = entry->n_value;
+    // Only names containing a '.' are given a source id.
+    if (strchr(unit.name, '.') != NULL)
+      unit.source_id = symbols->next_source_id++;
+    else
+      unit.source_id = -1;
+
+    const int consumed =
+        LoadFuncSymbols(entry, lists + nstab, stabstr_section, &unit);
+    symbols->source_file_info.push_back(unit);
+    index += consumed;
+  }
+
+  // Second pass, compute the size of functions and lines.
+  if (!ComputeSizeAndRVA(loading_addr, symbols))
+    return false;
+
+  // Third pass: so far only compilation units are known, but they can hold
+  // code from included files (header files especially); add those here.
+  AddIncludedFiles(symbols, stabstr_section);
+  return true;
+}
+
+// Loads the stab symbols of the mapped ELF image at |elf_header| into
+// |symbols|. The header offsets in the mapping are rewritten into addresses
+// first. Returns false when there is no stab section or loading fails.
+static bool LoadSymbols(ElfW(Ehdr)* elf_header, struct SymbolInfo* symbols) {
+  // Translate all offsets in section headers into address.
+  FixAddress(elf_header);
+
+  const ElfW(Phdr)* program_headers =
+      reinterpret_cast<ElfW(Phdr)*>(elf_header->e_phoff);
+  ElfW(Addr) loading_addr =
+      GetLoadingAddress(program_headers, elf_header->e_phnum);
+
+  const ElfW(Shdr)* sections =
+      reinterpret_cast<ElfW(Shdr)*>(elf_header->e_shoff);
+  const ElfW(Shdr)* strtab = sections + elf_header->e_shstrndx;
+  const ElfW(Shdr)* stab_section =
+      FindSectionByName(kStabName, sections, strtab, elf_header->e_shnum);
+  if (stab_section == NULL) {
+    fprintf(stderr, "Stab section not found.\n");
+    return false;
+  }
+
+  // The stab section links to the string table that holds its names.
+  const ElfW(Shdr)* stabstr_section = sections + stab_section->sh_link;
+  return LoadSymbols(stab_section, stabstr_section, loading_addr, symbols);
+}
+
+// Writes the "MODULE" record for |obj_file| to |fd|: operating system,
+// architecture, file identifier and the file name without its directory.
+// Returns false for architectures other than x86 and x86_64, when the file
+// identifier cannot be computed, or when writing fails.
+static bool WriteModuleInfo(int fd,
+                            ElfW(Half) arch,
+                            const std::string& obj_file) {
+  const char* arch_name = NULL;
+  switch (arch) {
+    case EM_386:
+      arch_name = "x86";
+      break;
+    case EM_X86_64:
+      arch_name = "x86_64";
+      break;
+    default:
+      return false;
+  }
+
+  uint8_t identifier[google_breakpad::kMDGUIDSize];
+  google_breakpad::FileID file_id(obj_file.c_str());
+  if (!file_id.ElfFileIdentifier(identifier))
+    return false;
+
+  char identifier_str[40];
+  file_id.ConvertIdentifierToString(identifier,
+                                    identifier_str, sizeof(identifier_str));
+
+  // Copy the identifier without its dashes into a zero-filled buffer.
+  char id_no_dash[40];
+  memset(id_no_dash, 0, sizeof(id_no_dash));
+  int out_len = 0;
+  for (const char* in = identifier_str; *in != '\0'; ++in) {
+    if (*in == '-')
+      continue;
+    id_no_dash[out_len++] = *in;
+  }
+  // Add an extra "0" at the end.
+  id_no_dash[out_len++] = '0';
+
+  // Keep only the part of the path after the last slash, if there is one.
+  const size_t slash_pos = obj_file.find_last_of("/");
+  const std::string filename = (slash_pos == std::string::npos)
+                                   ? obj_file
+                                   : obj_file.substr(slash_pos + 1);
+  return WriteFormat(fd, "MODULE Linux %s %s %s\n", arch_name,
+                     id_no_dash, filename.c_str());
+}
+
+// Writes one "FILE <id> <name>" record to |fd| for every source file that has
+// a source id (files whose id is -1 are skipped). Stops and returns false at
+// the first write that fails.
+static bool WriteSourceFileInfo(int fd, const struct SymbolInfo& symbols) {
+  const SourceFileInfoList& files = symbols.source_file_info;
+  SourceFileInfoList::const_iterator file = files.begin();
+  for (; file != files.end(); ++file) {
+    if (file->source_id == -1)
+      continue;
+    if (!WriteFormat(fd, "FILE %d %s\n", file->source_id, file->name))
+      return false;
+  }
+  return true;
+}
+
+// Writes the "FUNC" record of |func_info| to |fd|, followed by one record per
+// source line. Functions of size zero are skipped and count as success.
+// Returns false as soon as a write fails.
+static bool WriteOneFunction(int fd,
+                             const struct FuncInfo& func_info) {
+  // Nothing is emitted for empty functions, so check before demangling.
+  if (func_info.size == 0)
+    return true;
+
+  // Discard the ending part of the name (everything from the last colon).
+  std::string func_name(func_info.name);
+  std::string::size_type last_colon = func_name.find_last_of(':');
+  if (last_colon != std::string::npos)
+    func_name = func_name.substr(0, last_colon);
+  func_name = Demangle(func_name.c_str());
+
+  // The arguments are cast to exactly the types the conversion
+  // specifications expect: handing a 32-bit value to "%lx" is undefined
+  // where long is 64 bits wide.
+  if (!WriteFormat(fd, "FUNC %lx %lx %d %s\n",
+                   static_cast<unsigned long>(func_info.rva_to_base),
+                   static_cast<unsigned long>(func_info.size),
+                   static_cast<int>(func_info.stack_param_size),
+                   func_name.c_str()))
+    return false;
+
+  for (LineInfoList::const_iterator it = func_info.line_info.begin();
+       it != func_info.line_info.end(); ++it) {
+    const struct LineInfo& line_info = *it;
+    if (!WriteFormat(fd, "%lx %lx %d %d\n",
+                     static_cast<unsigned long>(line_info.rva_to_base),
+                     static_cast<unsigned long>(line_info.size),
+                     static_cast<int>(line_info.line_num),
+                     line_info.source_id))
+      return false;
+  }
+  return true;
+}
+
+// Writes the records of every function of every source file in |symbols| to
+// |fd|. Stops and returns false at the first function that cannot be written.
+static bool WriteFunctionInfo(int fd, const struct SymbolInfo& symbols) {
+  const SourceFileInfoList& files = symbols.source_file_info;
+  for (SourceFileInfoList::const_iterator file = files.begin();
+       file != files.end(); ++file) {
+    const FuncInfoList& functions = file->func_info;
+    for (FuncInfoList::const_iterator function = functions.begin();
+         function != functions.end(); ++function) {
+      if (!WriteOneFunction(fd, *function))
+        return false;
+    }
+  }
+  return true;
+}
+
+// Writes the source file records and then the function records of |symbols|
+// to |fd|. The functions are only written when the files were written.
+static bool DumpStabSymbols(int fd, const struct SymbolInfo& symbols) {
+  if (!WriteSourceFileInfo(fd, symbols))
+    return false;
+  return WriteFunctionInfo(fd, symbols);
+}
+
+//
+// FDWrapper
+//
+// Wrapper class to make sure an opened file is closed.
+// The wrapper owns the descriptor, so it must not be copied: two copies
+// would close the same descriptor twice.
+//
+class FDWrapper {
+ public:
+  explicit FDWrapper(int fd) :
+    fd_(fd) {
+  }
+  // Closes the descriptor unless it has been released.
+  ~FDWrapper() {
+    if (fd_ != -1)
+      close(fd_);
+  }
+  // Returns the wrapped descriptor without giving up ownership.
+  int get() const {
+    return fd_;
+  }
+  // Gives up ownership: returns the descriptor and will not close it.
+  int release() {
+    int fd = fd_;
+    fd_ = -1;
+    return fd;
+  }
+ private:
+  // Declared but not defined, to forbid copying.
+  FDWrapper(const FDWrapper&);
+  FDWrapper& operator=(const FDWrapper&);
+
+  int fd_;
+};
+
+//
+// MmapWrapper
+//
+// Wrapper class to make sure mapped regions are unmapped.
+// The wrapper owns the mapping, so it must not be copied: two copies would
+// unmap the same region twice.
+//
+class MmapWrapper {
+ public:
+  MmapWrapper(void* mapped_address, size_t mapped_size) :
+    base_(mapped_address), size_(mapped_size) {
+  }
+  // Unmaps the region unless it has been released.
+  ~MmapWrapper() {
+    if (base_ != NULL) {
+      assert(size_ > 0);
+      munmap(base_, size_);
+    }
+  }
+  // Gives up ownership: the region will not be unmapped by this object.
+  void release() {
+    base_ = NULL;
+    size_ = 0;
+  }
+
+ private:
+  // Declared but not defined, to forbid copying.
+  MmapWrapper(const MmapWrapper&);
+  MmapWrapper& operator=(const MmapWrapper&);
+
+  void* base_;
+  size_t size_;
+};
+
+} // namespace
+
+namespace google_breakpad {
+
+// Reads the stab debugging symbols of the ELF file |obj_file| and writes them
+// to the descriptor |sym_fd| as MODULE, FILE, FUNC and line records.
+// Returns false when the file cannot be opened, inspected or mapped, is too
+// small to hold an ELF header, is not an ELF file, has no loadable stab
+// symbols, or when writing fails.
+bool DumpSymbols::WriteSymbolFile(const std::string& obj_file,
+                                  int sym_fd) {
+  int obj_fd = open(obj_file.c_str(), O_RDONLY);
+  if (obj_fd < 0)
+    return false;
+  FDWrapper obj_fd_wrapper(obj_fd);
+
+  struct stat st;
+  // Either condition alone is fatal: |st| is meaningless when fstat fails,
+  // and a file shorter than an ELF header cannot be parsed.
+  if (fstat(obj_fd, &st) != 0)
+    return false;
+  if (st.st_size < static_cast<off_t>(sizeof(ElfW(Ehdr))))
+    return false;
+
+  // A private writable mapping: the header offsets are patched in memory
+  // while loading, without touching the file itself.
+  void* obj_base = mmap(NULL, st.st_size,
+                        PROT_READ | PROT_WRITE, MAP_PRIVATE, obj_fd, 0);
+  if (obj_base == MAP_FAILED)
+    return false;
+  MmapWrapper map_wrapper(obj_base, st.st_size);
+
+  ElfW(Ehdr)* elf_header = reinterpret_cast<ElfW(Ehdr)*>(obj_base);
+  if (!IsValidElf(elf_header))
+    return false;
+
+  struct SymbolInfo symbols;
+  symbols.next_source_id = 0;
+  if (!LoadSymbols(elf_header, &symbols))
+    return false;
+
+  // Write to symbol file.
+  return WriteModuleInfo(sym_fd, elf_header->e_machine, obj_file) &&
+         DumpStabSymbols(sym_fd, symbols);
+}
+
+} // namespace google_breakpad
diff --git a/breakpad/linux/dump_symbols.h b/breakpad/linux/dump_symbols.h
new file mode 100644
index 0000000..662b482
--- /dev/null
+++ b/breakpad/linux/dump_symbols.h
@@ -0,0 +1,47 @@
+// Copyright (c) 2006, 2009, Google Inc.
+// All rights reserved.
+//
+// Redistribution and use in source and binary forms, with or without
+// modification, are permitted provided that the following conditions are
+// met:
+//
+// * Redistributions of source code must retain the above copyright
+// notice, this list of conditions and the following disclaimer.
+// * Redistributions in binary form must reproduce the above
+// copyright notice, this list of conditions and the following disclaimer
+// in the documentation and/or other materials provided with the
+// distribution.
+// * Neither the name of Google Inc. nor the names of its
+// contributors may be used to endorse or promote products derived from
+// this software without specific prior written permission.
+//
+// THIS SOFTWARE IS PROVIDED BY THE COPYRIGHT HOLDERS AND CONTRIBUTORS
+// "AS IS" AND ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT
+// LIMITED TO, THE IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR
+// A PARTICULAR PURPOSE ARE DISCLAIMED. IN NO EVENT SHALL THE COPYRIGHT
+// OWNER OR CONTRIBUTORS BE LIABLE FOR ANY DIRECT, INDIRECT, INCIDENTAL,
+// SPECIAL, EXEMPLARY, OR CONSEQUENTIAL DAMAGES (INCLUDING, BUT NOT
+// LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS OR SERVICES; LOSS OF USE,
+// DATA, OR PROFITS; OR BUSINESS INTERRUPTION) HOWEVER CAUSED AND ON ANY
+// THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT LIABILITY, OR TORT
+// (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY OUT OF THE USE
+// OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE.
+//
+// dump_symbols.h: Declares the interface of a Linux stab debugging format dumper.
+//
+
+#ifndef BREAKPAD_LINUX_DUMP_SYMBOLS_H_
+#define BREAKPAD_LINUX_DUMP_SYMBOLS_H_
+
+#include <string>
+
+namespace google_breakpad {
+
+// Entry point of the Linux stab symbol dumper.
+class DumpSymbols {
+ public:
+ // Writes the symbols of the object file |obj_file| to the already opened
+ // file descriptor |sym_fd|. Returns true on success, false otherwise.
+ static bool WriteSymbolFile(const std::string& obj_file, int sym_fd);
+};
+
+} // namespace google_breakpad
+
+#endif // BREAKPAD_LINUX_DUMP_SYMBOLS_H_
diff --git a/breakpad/linux/dump_syms.cc b/breakpad/linux/dump_syms.cc
new file mode 100644
index 0000000..2d90acd
--- /dev/null
+++ b/breakpad/linux/dump_syms.cc
@@ -0,0 +1,50 @@
+// Copyright (c) 2006, 2009, Google Inc.
+// All rights reserved.
+//
+// Redistribution and use in source and binary forms, with or without
+// modification, are permitted provided that the following conditions are
+// met:
+//
+// * Redistributions of source code must retain the above copyright
+// notice, this list of conditions and the following disclaimer.
+// * Redistributions in binary form must reproduce the above
+// copyright notice, this list of conditions and the following disclaimer
+// in the documentation and/or other materials provided with the
+// distribution.
+// * Neither the name of Google Inc. nor the names of its
+// contributors may be used to endorse or promote products derived from
+// this software without specific prior written permission.
+//
+// THIS SOFTWARE IS PROVIDED BY THE COPYRIGHT HOLDERS AND CONTRIBUTORS
+// "AS IS" AND ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT
+// LIMITED TO, THE IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR
+// A PARTICULAR PURPOSE ARE DISCLAIMED. IN NO EVENT SHALL THE COPYRIGHT
+// OWNER OR CONTRIBUTORS BE LIABLE FOR ANY DIRECT, INDIRECT, INCIDENTAL,
+// SPECIAL, EXEMPLARY, OR CONSEQUENTIAL DAMAGES (INCLUDING, BUT NOT
+// LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS OR SERVICES; LOSS OF USE,
+// DATA, OR PROFITS; OR BUSINESS INTERRUPTION) HOWEVER CAUSED AND ON ANY
+// THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT LIABILITY, OR TORT
+// (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY OUT OF THE USE
+// OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE.
+
+#include <string>
+#include <cstdio>
+
+#include "breakpad/linux/dump_symbols.h"
+
+using google_breakpad::DumpSymbols;
+
+// Dumps the stab symbols of the binary named on the command line to stdout.
+// Exits with 1 on a usage error or when the symbols cannot be written.
+int main(int argc, char** argv) {
+  const int kExpectedArgc = 2;
+  if (argc != kExpectedArgc) {
+    fprintf(stderr, "Usage: %s <binary-with-stab-symbol>\n", argv[0]);
+    return 1;
+  }
+
+  const bool written =
+      DumpSymbols::WriteSymbolFile(argv[1], fileno(stdout));
+  if (written)
+    return 0;
+
+  fprintf(stderr, "Failed to write symbol file.\n");
+  return 1;
+}
diff --git a/breakpad/linux/file_id.cc b/breakpad/linux/file_id.cc
new file mode 100644
index 0000000..5ba955b
--- /dev/null
+++ b/breakpad/linux/file_id.cc
@@ -0,0 +1,103 @@
+// Copyright (c) 2006, 2009, Google Inc.
+// All rights reserved.
+//
+// Redistribution and use in source and binary forms, with or without
+// modification, are permitted provided that the following conditions are
+// met:
+//
+// * Redistributions of source code must retain the above copyright
+// notice, this list of conditions and the following disclaimer.
+// * Redistributions in binary form must reproduce the above
+// copyright notice, this list of conditions and the following disclaimer
+// in the documentation and/or other materials provided with the
+// distribution.
+// * Neither the name of Google Inc. nor the names of its
+// contributors may be used to endorse or promote products derived from
+// this software without specific prior written permission.
+//
+// THIS SOFTWARE IS PROVIDED BY THE COPYRIGHT HOLDERS AND CONTRIBUTORS
+// "AS IS" AND ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT
+// LIMITED TO, THE IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR
+// A PARTICULAR PURPOSE ARE DISCLAIMED. IN NO EVENT SHALL THE COPYRIGHT
+// OWNER OR CONTRIBUTORS BE LIABLE FOR ANY DIRECT, INDIRECT, INCIDENTAL,
+// SPECIAL, EXEMPLARY, OR CONSEQUENTIAL DAMAGES (INCLUDING, BUT NOT
+// LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS OR SERVICES; LOSS OF USE,
+// DATA, OR PROFITS; OR BUSINESS INTERRUPTION) HOWEVER CAUSED AND ON ANY
+// THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT LIABILITY, OR TORT
+// (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY OUT OF THE USE
+// OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE.
+//
+// file_id.cc: Return a unique identifier for a file
+//
+// See file_id.h for documentation
+//
+
+#include "breakpad/linux/file_id.h"
+
+#include <elf.h>
+#include <fcntl.h>
+#include <link.h>
+#include <string.h>
+#include <sys/mman.h>
+#include <unistd.h>
+
+#include <cassert>
+#include <cstdio>
+
+namespace google_breakpad {
+
+// Stores a private copy of |path| in |path_|.
+// A path that does not fit is truncated to sizeof(path_) - 1 bytes; |path_|
+// is always NUL terminated so it can safely be handed to open().
+FileID::FileID(const char* path) {
+  // strncpy() does not terminate the destination when the source fills it,
+  // so copy one byte less than the capacity and terminate explicitly.
+  strncpy(path_, path, sizeof(path_) - 1);
+  path_[sizeof(path_) - 1] = '\0';
+}
+
+// Computes the identifier of the file at |path_| by XOR-folding its first
+// page, kMDGUIDSize bytes at a time, into |identifier|.
+// Returns false, leaving |identifier| untouched, when the file cannot be
+// opened, cannot be stat'ed, is not strictly larger than one page, or cannot
+// be mapped.
+bool FileID::ElfFileIdentifier(uint8_t identifier[kMDGUIDSize]) {
+  const size_t page_len = 4096;  // Page size (matches WriteMappings())
+
+  const int file = open(path_, O_RDONLY);
+  if (file < 0)
+    return false;
+
+  // Only attempt the mapping when the file holds more than one page.
+  struct stat info;
+  const bool large_enough = fstat(file, &info) == 0 && info.st_size > page_len;
+  void* mapping = MAP_FAILED;
+  if (large_enough) {
+    mapping = mmap(NULL, page_len,
+                   PROT_READ | PROT_WRITE, MAP_PRIVATE, file, 0);
+  }
+
+  // The descriptor is no longer needed once the mapping has been attempted.
+  close(file);
+  if (mapping == MAP_FAILED)
+    return false;
+
+  memset(identifier, 0, kMDGUIDSize);
+  const uint8_t* page = reinterpret_cast<const uint8_t*>(mapping);
+  for (size_t offset = 0; offset < page_len; offset += kMDGUIDSize) {
+    for (size_t i = 0; i < kMDGUIDSize; ++i)
+      identifier[i] ^= page[offset + i];
+  }
+
+  munmap(mapping, page_len);
+  return true;
+}
+
+// static
+// Formats |identifier| into |buffer| as upper-case hex digits with a '-'
+// inserted before bytes 4, 6, 8 and 10 (36 characters for a 16-byte
+// identifier), followed by a terminating NUL.
+// At most |buffer_length| bytes are written, terminator included; a buffer
+// that is too small receives a truncated, still NUL-terminated string.
+// Nothing is written when |buffer| is null or |buffer_length| is not
+// positive.
+void FileID::ConvertIdentifierToString(const uint8_t identifier[kMDGUIDSize],
+                                       char* buffer, int buffer_length) {
+  if (!buffer || buffer_length <= 0)
+    return;
+
+  static const char kHexDigits[] = "0123456789ABCDEF";
+
+  // Keep the last byte free for the terminator so that every write below,
+  // including the terminator itself, stays inside the buffer.
+  const int max_chars = buffer_length - 1;
+  int buffer_idx = 0;
+  for (size_t idx = 0; idx < kMDGUIDSize && buffer_idx < max_chars; ++idx) {
+    if (idx == 4 || idx == 6 || idx == 8 || idx == 10)
+      buffer[buffer_idx++] = '-';
+
+    // Each byte contributes up to two characters; check before each one
+    // because the separator or the first digit may have used the last slot.
+    if (buffer_idx < max_chars)
+      buffer[buffer_idx++] = kHexDigits[(identifier[idx] >> 4) & 0x0F];
+    if (buffer_idx < max_chars)
+      buffer[buffer_idx++] = kHexDigits[identifier[idx] & 0x0F];
+  }
+
+  // NULL terminate
+  buffer[buffer_idx] = '\0';
+}
+
+} // namespace google_breakpad
diff --git a/breakpad/linux/file_id.h b/breakpad/linux/file_id.h
new file mode 100644
index 0000000..1504fa2
--- /dev/null
+++ b/breakpad/linux/file_id.h
@@ -0,0 +1,70 @@
+// Copyright (c) 2006, 2009, Google Inc.
+// All rights reserved.
+//
+// Redistribution and use in source and binary forms, with or without
+// modification, are permitted provided that the following conditions are
+// met:
+//
+// * Redistributions of source code must retain the above copyright
+// notice, this list of conditions and the following disclaimer.
+// * Redistributions in binary form must reproduce the above
+// copyright notice, this list of conditions and the following disclaimer
+// in the documentation and/or other materials provided with the
+// distribution.
+// * Neither the name of Google Inc. nor the names of its
+// contributors may be used to endorse or promote products derived from
+// this software without specific prior written permission.
+//
+// THIS SOFTWARE IS PROVIDED BY THE COPYRIGHT HOLDERS AND CONTRIBUTORS
+// "AS IS" AND ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT
+// LIMITED TO, THE IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR
+// A PARTICULAR PURPOSE ARE DISCLAIMED. IN NO EVENT SHALL THE COPYRIGHT
+// OWNER OR CONTRIBUTORS BE LIABLE FOR ANY DIRECT, INDIRECT, INCIDENTAL,
+// SPECIAL, EXEMPLARY, OR CONSEQUENTIAL DAMAGES (INCLUDING, BUT NOT
+// LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS OR SERVICES; LOSS OF USE,
+// DATA, OR PROFITS; OR BUSINESS INTERRUPTION) HOWEVER CAUSED AND ON ANY
+// THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT LIABILITY, OR TORT
+// (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY OUT OF THE USE
+// OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE.
+//
+// file_id.h: Return a unique identifier for a file
+//
+
+#ifndef BREAKPAD_LINUX_FILE_ID_H_
+#define BREAKPAD_LINUX_FILE_ID_H_
+
+#include <limits.h>
+
+#include "common/linux/guid_creator.h"
+
+namespace google_breakpad {
+
+// Size in bytes of an MDGUID; this is the length of the identifier buffers
+// taken by the FileID methods below.
+static const size_t kMDGUIDSize = sizeof(MDGUID);
+
+// Produces an identifier for the file at a given path and formats such
+// identifiers as UUID-style strings.
+class FileID {
+ public:
+ // Copies |path| into internal storage of PATH_MAX bytes; the caller's string
+ // is not referenced after construction.
+ explicit FileID(const char* path);
+ ~FileID() {}
+
+ // Load the identifier for the elf file path specified in the constructor into
+ // |identifier|. Return false if the identifier could not be created for the
+ // file: it could not be opened, stat'ed or mapped, or it is not larger than
+ // one 4096-byte page.
+ // The current implementation will XOR the first page of data, kMDGUIDSize
+ // bytes at a time, to generate an identifier.
+ bool ElfFileIdentifier(uint8_t identifier[kMDGUIDSize]);
+
+ // Convert the |identifier| data to a NULL terminated string. The string will
+ // be formatted as a UUID (e.g., 22F065BB-FC9C-49F7-80FE-26A7CEBD7BCE), using
+ // upper-case hex digits.
+ // The |buffer| should be at least 37 bytes long to receive all of the data
+ // and termination. Shorter buffers will contain truncated data.
+ static void ConvertIdentifierToString(const uint8_t identifier[kMDGUIDSize],
+ char* buffer, int buffer_length);
+
+ private:
+ // Storage for the path specified in the constructor.
+ char path_[PATH_MAX];
+};
+
+} // namespace google_breakpad
+
+#endif // BREAKPAD_LINUX_FILE_ID_H_