#! /usr/bin/env python
# -*- coding: iso-8859-1 -*- #
# Copyright, license and disclaimer are at the end of this file.
'''Usage: backtrace2line <backtrace_file> [<src_dir> ...]
This program adds the source file name and line number to stack
traces*) generated by Linux' function backtrace_symbols_fd.
Each stack frame line**) in the input file originating from the
function backtrace_symbols_fd is extended with the file name and
line number returned by utility addr2line. All other lines from
the input file remain unchanged.
However, line numbers returned by addr2line are often inaccurate
and typically too high. If any <src_dir> arguments are supplied
on the command line, the line numbers from addr2line may be
adjusted after searching the source file for the nearest lines
containing the symbol. Adjusted line numbers are marked with *.
Symbol search is simplistic. Code and comment lines in source
files are searched within a limited range around the line number
returned by addr2line.
Example of a stack trace obtained from an instrumented Python
2.5.1 binary (abbreviated), before
/Python-2.5.1/python(PyObject_Free+0x15b)[0x8088b07]
/Python-2.5.1/python(PyDict_SetItem+0x1a6)[0x80824ae]
/Python-2.5.1/python(_PyModule_Clear+0x146)[0x80854ca]
/Python-2.5.1/python(PyImport_Cleanup+0x291)[0x80d6b25]
/Python-2.5.1/python(Py_Finalize+0xaf)[0x80e3b53]
/Python-2.5.1/python(Py_Main+0x30b)[0x80565d7]
/Python-2.5.1/python(main+0x17)[0x80562c7]
after backtrace2line
/Python-2.5.1/python(PyObject_Free+0x15b)[0x8088b07] Objects/obmalloc.c:1123
/Python-2.5.1/python(PyDict_SetItem+0x1a6)[0x80824ae] Objects/dictobject.c:412
/Python-2.5.1/python(_PyModule_Clear+0x146)[0x80854ca] Objects/moduleobject.c:136
/Python-2.5.1/python(PyImport_Cleanup+0x291)[0x80d6b25] Python/import.c:469
/Python-2.5.1/python(Py_Finalize+0xaf)[0x80e3b53] Python/pythonrun.c:419
/Python-2.5.1/python(Py_Main+0x30b)[0x80565d7] Modules/main.c:565
/Python-2.5.1/python(main+0x17)[0x80562c7] ./Modules/python.c:24
after backtrace2line ... with <src_dir> adjusting several line numbers
/Python-2.5.1/python(PyObject_Free+0x15b)[0x8088b07] Objects/obmalloc.c:1123
/Python-2.5.1/python(PyDict_SetItem+0x1a6)[0x80824ae] Objects/dictobject.c:412
/Python-2.5.1/python(_PyModule_Clear+0x146)[0x80854ca] Objects/moduleobject.c:136*
/Python-2.5.1/python(PyImport_Cleanup+0x291)[0x80d6b25] Python/import.c:468*
/Python-2.5.1/python(Py_Finalize+0xaf)[0x80e3b53] Python/pythonrun.c:397*
/Python-2.5.1/python(Py_Main+0x30b)[0x80565d7] Modules/main.c:545*
/Python-2.5.1/python(main+0x17)[0x80562c7] ./Modules/python.c:23*
----
*) Stack frames from backtrace_symbols_fd are listed in order
most-recently-called-first, i.e. main is near the bottom
of each backtrace list.
**) Stack frame lines from backtrace_symbols_fd have one of
the following three formats:
<path>(<function>*0x<offset>)[0x<address>]
or
<path>[0x<address>]
or
[0x<address>]
where * means + or -. Only frames starting with a <path>
can be extended with a file name and line number and only
frames containing a <function> can be adjusted.
'''
# version number and date of this revision of the script
__version__ = '1.2 (Dec 20, 2010)'
import os, sys
class _Frame(object):
'''Stack frame object.
'''
addr = '' # address string, 0x...
call = None # frame called
file = '' # source file name
line = '' # source line number string
lino = 0 # line number in original, input file
name = '' # function name/symbol iff present
path = '' # library or executable path
def __init__(self, text, lino=0, call=None, skip=None):
b = text.rfind('[0x')
if b > 0:
# get address
a = text[b:].rstrip()
if a.endswith(']') and len(a) <= 20: # 64-bit
# save in frame
self.addr = a[1:-1]
self.call = call
self.lino = lino
if skip: # till start of path
a = text.find(skip, 0, b) + 1
else:
a = 0
# get path till '(' iff present
if text[b-1] == ')':
p = text.find('(', a, b)
if p > a:
self.path = text[a:p]
# get function till offset
f = text.find('0x', p, b) - 1
if f > 0 and (text[f] == '+' or text[f] == '-'):
self.name = text[p+1:f]
else:
self.path = text[a:b]
# number of addresses above which _addr2line splits its address
# list over more than one invocation of the addr2line utility
_ARG_MAX = 256  # some limit for addr2line
def _addr2line(path, *args):
    '''Return list of filename:linenumbers for
       address(es) in a library or executable.

       path -- library or executable, passed to addr2line -e
       args -- address strings, 0x...

       The addresses are handed to the addr2line utility in
       batches of at most _ARG_MAX.  The list returned holds
       the output lines of the utility, line break included,
       normally one line per address.  An empty list is
       returned if the utility can not be run.  A message is
       printed if the number of output lines differs from the
       number of addresses; the lines are returned regardless.
    '''
    # imported here, no other part of this file needs it
    import subprocess

    lines = []
    for i in range(0, len(args), _ARG_MAX):
        batch = list(args[i:i + _ARG_MAX])
        # an argument list instead of a shell command line, such
        # that blanks or shell meta-characters in a path taken
        # from the backtrace file are passed on unchanged
        cmd = [_addr2line_bin, '-e', path] + batch
        try:
            p = subprocess.Popen(cmd, stdout=subprocess.PIPE,
                                      universal_newlines=True)
            try:
                # _addr2line_bin prints one filename:linenumber
                # line per address or '??:0' in case of errors
                lines.extend(p.stdout.readlines())
            finally:
                p.stdout.close()
                p.wait()
        except (OSError, ValueError):
            _print("%.*s... (%d) failed", 80, ' '.join(cmd), len(batch))
            return []
    if len(lines) != len(args):
        t = "%s -e %s" % (_addr2line_bin, path)
        _print("%.*s... mismatch: %d vs %d", 80, t, len(lines), len(args))
    return lines
def _adjust(frames, srcpath):
'''For each frame, find the function called in the
source file near the line number from addr2line
and if found adjust the line number accordingly.
'''
def _cmp(f1, f2):
if f1.file < f2.file:
return -1
if f1.file > f2.file:
return +1
return 0
# sort frames by file
frames.sort(_cmp)
# cache source lines
p, t, r = '', [], 0
for f in frames:
if f.call and f.call.name and f.file != '??':
# get source file as lines
p, t = _source(_which(f.file, srcpath), p, t)
if t: # find nearest line(s)
n = _search(f.call.name, t, int(f.line.rstrip()))
if n: # adjust frame line
f.line = '+'.join([str(i) for i in n]) + '*' + os.linesep
r += len(n)
return r # number of adjustments
def _backtrace2line(name, ldpath=None, srcpath=None):
    '''Get a backtrace file and use addr2line
       on every stack frame line in that file,
       with adjusted line number if requested.

       name    -- name of the backtrace file
       ldpath  -- directories searched for libraries and
                  executables not given by an absolute path
       srcpath -- source directories; if set, line numbers
                  are adjusted by searching the source files

       Returns the contents of the backtrace file as a single
       string, with file name and line number appended to each
       stack frame line which could be resolved.  Returns None
       after printing a message if the file can not be read.
    '''
    try:
        f = open(name, 'rt')
        try:
            ts = f.readlines()
        finally:
            f.close()
    except (IOError, OSError, UnicodeError):
        _print("open failed: %r", name)
        return None

    # skip till start of path
    s = ' ' + os.path.sep

    # create a _Frame instance for each stack
    # frame line and collect all _Frames of a
    # library or executable in a separate list
    pfs, f = {}, None
    for i, t in enumerate(ts):
        f = _Frame(t, i, f, skip=s)
        if f.path:
            pfs.setdefault(f.path, []).append(f)
        else:  # not a <path> frame
            f = None

    # for each library or executable, get a list
    # of addresses, pass those to addr2line, save
    # the file name and (adjusted) line number in
    # the _Frame and append the final result to
    # the original line of the input file
    for p, fs in pfs.items():
        p = _which(p, ldpath)
        if not p:
            continue
        locs = _addr2line(p, *[f.addr for f in fs])
        # pair frames and output lines, such that a short or
        # malformed reply leaves the remaining lines unchanged
        done = []
        for f, loc in zip(fs, locs):
            parts = loc.rsplit(':', 1)
            if len(parts) == 2:
                f.file, f.line = parts
                done.append(f)
        if done and srcpath:
            _adjust(done, srcpath)
        for f in done:
            i = f.lino
            # f.line still ends with the line break from addr2line
            ts[i] = ts[i].rstrip() + ' ' + f.file + ':' + f.line

    return ''.join(ts)  # as string
def _print(fmt, *args):
'''Print a message.
'''
print "%s: %s" % (sys.argv[0], (fmt % args))
def _search(name, text, line, before=32, after=16):
'''Find name in text lines within a range
before and after a given line number.
'''
b = max(line - max(0, before), 1) # 1-origin
a = min(line + max(0, after), len(text))
r = [] # search back- and forward
for n, s in [(line, -1), (line+1, +1)]:
while b <= n <= a:
if text[n-1].find(name) < 0:
n += s
else:
r.append(n)
break # while
return r # list of 0, 1 or 2 line numbers
def _source(path, prev, text):
'''Get source lines of a source file
iff different from the previous one.
'''
if path == prev:
t = text
elif path:
try:
f = open(path, 'rt')
t = f.readlines()
f.close()
except:
t = []
else:
t = []
return (path, t)
def _which(name, PATH=None, exit=0):
'''Find fully qualified path for a file.
'''
n = os.path.expanduser(name)
if os.path.isabs(n):
return n
p = PATH or os.environ.get('PATH', '')
for d in p.split(os.pathsep):
f = os.path.join(d, n)
if os.path.isfile(f):
return f
if exit:
_print("utility %r missing", name)
sys.exit(exit)
return None
# locate the addr2line utility on PATH when this module is loaded;
# _which prints a message and exits with status os.EX_OSFILE if
# the utility is not found
_addr2line_bin = _which('addr2line', exit=os.EX_OSFILE)
if __name__ == '__main__':
    # command line: <backtrace_file> [<src_dir> ...], the
    # annotated backtrace is printed to standard output

    argc = len(sys.argv)
    if argc < 2 or sys.argv[1].startswith('-'):
        _print("usage: %s <backtrace_file> [<src_dir> ...]", os.path.basename(sys.argv[0]))
        sys.exit(os.EX_USAGE)

    # default library path
    ldp = '/usr/local/lib:/usr/lib:/lib'
    if sys.platform.startswith('darwin'):
        ldp = os.environ.get('DYLD_LIBRARY_PATH',
              os.environ.get('DYLD_FALLBACK_LIBRARY_PATH', ldp))
    else:  # assume *nix
        ldp = os.environ.get('LD_LIBRARY_PATH', ldp)

    src = None  # no line number adjustment without src_dirs
    ds = sys.argv[2:]
    if ds:  # check src_dirs
        for d in ds:
            if not os.path.isdir(d):
                _print("not a directory: %r", d)
                sys.exit(os.EX_OSFILE)
        src = os.pathsep.join(ds)

    out = _backtrace2line(sys.argv[1], ldp, src)
    if out is None:
        # the backtrace file could not be read and a message has
        # been printed; do not print the string None as result
        sys.exit(os.EX_NOINPUT)
    # a single, parenthesized expression prints the same with
    # the Python 2 statement and with the Python 3 function
    print(out)
#---------------------------------------------------------------------
# Copyright (c) 2007-2010 -- Jean Brouwers. All rights reserved.
#
# Redistribution and use in source and binary forms, with or without
# modification, are permitted provided that the following conditions
# are met:
#
# - Redistributions of source code must retain the above copyright
# notice, this list of conditions and the following disclaimer.
#
# - Redistributions in binary form must reproduce the above copyright
# notice, this list of conditions and the following disclaimer in
# the documentation and/or other materials provided with the
# distribution.
#
# - Neither the name Jean Brouwers nor the names of any of the
# contributors may be used to endorse or promote products derived
# from this software without specific prior written permission.
#
# THIS SOFTWARE IS PROVIDED BY THE COPYRIGHT HOLDERS AND CONTRIBUTORS
# "AS IS" AND ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT
# LIMITED TO, THE IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS
# FOR A PARTICULAR PURPOSE ARE DISCLAIMED. IN NO EVENT SHALL THE
# COPYRIGHT OWNER OR CONTRIBUTORS BE LIABLE FOR ANY DIRECT, INDIRECT,
# INCIDENTAL, SPECIAL, EXEMPLARY, OR CONSEQUENTIAL DAMAGES
# (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS OR
# SERVICES; LOSS OF USE, DATA, OR PROFITS; OR BUSINESS INTERRUPTION)
# HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY, WHETHER IN CONTRACT,
# STRICT LIABILITY, OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE)
# ARISING IN ANY WAY OUT OF THE USE OF THIS SOFTWARE, EVEN IF ADVISED
# OF THE POSSIBILITY OF SUCH DAMAGE.
#---------------------------------------------------------------------
Diff to Previous Revision
--- revision 2 2008-02-22 19:42:34
+++ revision 3 2010-12-20 06:57:29
@@ -74,7 +74,7 @@
frames containing a <function> can be adjusted.
'''
-__version__ = '1.1 (Jan 08, 2008)'
+__version__ = '1.2 (Dec 20, 2010)'
import os, sys
@@ -282,7 +282,7 @@
# default library path
ldp = '/usr/local/lib:/usr/lib:/lib'
- if sys.platform == 'darwin':
+ if sys.platform.startswith('darwin'):
ldp = os.environ.get('DYLD_LIBRARY_PATH',
os.environ.get('DYLD_FALLBACK_LIBRARY_PATH', ldp))
else: # assume *nix
@@ -301,7 +301,7 @@
#---------------------------------------------------------------------
-# Copyright (c) 2007-2008 -- Jean Brouwers. All rights reserved.
+# Copyright (c) 2007-2010 -- Jean Brouwers. All rights reserved.
#
# Redistribution and use in source and binary forms, with or without
# modification, are permitted provided that the following conditions