#!/usr/bin/env python
#
# Copyright 2013 The Chromium Authors. All rights reserved.
# Use of this source code is governed by a BSD-style license that can be
# found in the LICENSE file.
"""Symbolizes stack traces generated by Chromium for Android.
Sample usage:
adb logcat chromium:V | symbolize.py
"""
import os
import re
import sys
from pylib import constants
# Uses symbol.py from third_party/android_platform, not python's.
sys.path.insert(0,
os.path.join(constants.DIR_SOURCE_ROOT,
'third_party/android_platform/development/scripts'))
import symbol
# Sample output from base/debug/stack_trace_android.cc
#   #00 0x693cd34f /path/to/some/libfoo.so+0x0007434f
#
# Named groups consumed by Symbolizer.write():
#   frame - frame number and absolute address, e.g. '#00 0x693cd34f'
#   lib   - library path, i.e. everything up to the '+'
#   addr  - 8 hex digit offset inside the library (without the '0x' prefix)
#
# Raw strings keep the regex escapes (\# and \+) from being interpreted as
# (invalid) string escapes.
TRACE_LINE = re.compile(r'(?P<frame>\#[0-9]+ 0x[0-9a-f]{8,8}) '
                        r'(?P<lib>[^+]+)\+0x(?P<addr>[0-9a-f]{8,8})')
class Symbolizer(object):
  """Write-through filter that symbolizes stack frames in the text it is given.

  Text passed to write() is scanned for TRACE_LINE matches. For each match the
  'lib+0xaddr' portion is replaced by the symbol reported by
  symbol.SymbolInformation(); everything else is forwarded unchanged to the
  wrapped output object.
  """

  def __init__(self, output):
    """Stores the object (providing write() and flush()) to forward to."""
    self._output = output

  def write(self, data):
    """Forwards |data| to the output, symbolizing every stack frame found.

    A frame whose lookup yields no symbol is passed through verbatim.
    """
    emit = self._output.write
    remaining = data
    found = re.search(TRACE_LINE, remaining)
    while found:
      frame_start = found.start('frame')
      frame_end = found.end('addr')

      # TODO(scherkus): Doing a single lookup per line is pretty slow,
      # especially with larger libraries. Consider caching strategies such as:
      # 1) Have Python load the libraries and do symbol lookups instead of
      #    calling out to addr2line each time.
      # 2) Have Python keep multiple addr2line instances open as subprocesses,
      #    piping addresses and reading back symbols as we find them
      # 3) Read ahead the entire stack trace until we find no more, then batch
      #    the symbol lookups.
      #
      # TODO(scherkus): These results are memoized, which could result in
      # incorrect lookups when running this script on long-lived instances
      # (e.g., adb logcat) when doing incremental development. Consider
      # clearing the cache when modification timestamp of libraries change.
      resolved = symbol.SymbolInformation(
          found.group('lib'), found.group('addr'), False)[0][0]

      if resolved:
        # Keep the text before the frame and the frame itself, then swap the
        # 'lib+0xaddr' part for the symbol.
        emit(remaining[:frame_start])
        emit(found.group('frame'))
        emit(' ')
        emit(resolved)
      else:
        # No symbol available: pass the matched text through untouched.
        emit(remaining[:frame_end])

      # Either way, resume scanning right after the address just handled.
      remaining = remaining[frame_end:]
      found = re.search(TRACE_LINE, remaining)

    # Whatever is left contains no (further) stack frames.
    emit(remaining)

  def flush(self):
    """Flushes the wrapped output object."""
    self._output.flush()
def main():
  """Copies stdin to stdout line by line through a Symbolizer."""
  stdout_symbolizer = Symbolizer(sys.stdout)
  for log_line in sys.stdin:
    stdout_symbolizer.write(log_line)
  # Push out anything still buffered once stdin is exhausted.
  stdout_symbolizer.flush()


# Only run when executed as a script, not when imported.
if __name__ == '__main__':
  main()