#!/usr/bin/env python
#===- lib/asan/scripts/asan_symbolize.py -----------------------------------===#
#
# The LLVM Compiler Infrastructure
#
# This file is distributed under the University of Illinois Open Source
# License. See LICENSE.TXT for details.
#
#===------------------------------------------------------------------------===#
import os
import re
import sys
import string
import subprocess
pipes = {}
filetypes = {}
DEBUG=False
def patch_address(frameno, addr_s):
    """Return the address that should be symbolized for frame `frameno`.

    The top frame (frame '0') normally holds the return address of the
    asan_report* call, which is not expected to return at all.  Because of
    that, the address often belongs to the next source code line, or even to
    a different function, so it is moved back by one byte.  On ARM the Thumb
    bit is cleared first, so an odd address moves back by two in total.

    Args:
      frameno: frame number, as the decimal string captured from the report.
      addr_s: hexadecimal address string, e.g. '0x11fe45'.

    Returns:
      The adjusted address as a '0x...' string for frame '0'; `addr_s`
      unchanged for every other frame.
    """
    if frameno != '0':
        return addr_s
    addr = int(addr_s, 16)
    if os.uname()[4].startswith('arm'):
        # Cancel the Thumb bit.
        addr &= ~1
    # Step back into the calling instruction, but never below address zero.
    addr = max(addr - 1, 0)
    # Format explicitly instead of using hex(): on Python 2, hex() appends an
    # 'L' suffix to long values, which is not a valid hexadecimal literal.
    return '0x%x' % addr
def fix_filename(file_name):
    """Shorten a 'file:line' source location for display.

    Every command-line argument (sys.argv[1:]) is used as a regular
    expression: the greedy prefix of `file_name` up to and including a match
    of that expression is removed.  Afterwards, locations inside asan_*.cc
    files collapse to '_asan_rtl_', and anything ending in 'crtstuff.c:0' is
    replaced by '???:0'.

    Args:
      file_name: location string to clean up.

    Returns:
      The shortened location string.
    """
    for path_to_cut in sys.argv[1:]:
        # path_to_cut is deliberately left unescaped: it is applied as a
        # regular expression, exactly as given on the command line.
        file_name = re.sub(".*" + path_to_cut, "", file_name)
    # The dots in front of the extensions are escaped so that only genuine
    # 'asan_*.cc' and 'crtstuff.c' names are rewritten.
    file_name = re.sub(r".*asan_[a-z_]*\.cc:[0-9]*", "_asan_rtl_", file_name)
    file_name = re.sub(r".*crtstuff\.c:0", "???:0", file_name)
    return file_name
# TODO(glider): need some refactoring here
def symbolize_addr2line(line):
    """Symbolize one report line with addr2line and print the result.

    A stack frame line looks like
        #0 0x7f6e35cf2e45 (/blah/foo.so+0x11fe45)
    For such a line the module offset (adjusted by patch_address) is written
    to an `addr2line -f -e <binary>` process; one process per binary is kept
    in the module-level `pipes` dict.  The frame is printed as
    '<frame prefix> in <function> <file:line>'.  Any other line is printed
    back with its trailing whitespace stripped.

    Args:
      line: one line of the report, usually ending with a newline.
    """
    match = re.match(
        r'^( *#([0-9]+) *0x[0-9a-f]+) *\((.*)\+(0x[0-9a-f]+)\)', line)
    if not match:
        print(line.rstrip())
        return
    frameno = match.group(2)
    binary = match.group(3)
    addr = patch_address(frameno, match.group(4))
    if binary not in pipes:
        # universal_newlines gives text-mode pipes on Python 3 as well.
        pipes[binary] = subprocess.Popen(
            ["addr2line", "-f", "-e", binary],
            stdin=subprocess.PIPE, stdout=subprocess.PIPE,
            universal_newlines=True)
    p = pipes[binary]
    try:
        p.stdin.write(addr + "\n")
        # Push the request out now; the reply is read immediately below.
        p.stdin.flush()
        function_name = p.stdout.readline().rstrip()
        file_name = p.stdout.readline().rstrip()
    except (IOError, OSError):
        # Best effort: if the pipe to addr2line is broken, print the frame
        # without symbol information instead of aborting the whole report.
        function_name = ""
        file_name = ""
    file_name = fix_filename(file_name)
    print("%s in %s %s" % (match.group(1), function_name, file_name))
def get_macho_filetype(binary):
    """Return the Mach-O file type of `binary` according to `otool -Vh`.

    Results are memoized in the module-level `filetypes` dict, so otool runs
    at most once per binary.

    Args:
      binary: path of the binary to inspect.

    Returns:
      "DYLIB" or "EXECUTE" when that word occurs in otool's output (if both
      occur, "EXECUTE" wins because it is checked last), or None when
      neither occurs.
    """
    if binary not in filetypes:
        otool_pipe = subprocess.Popen(["otool", "-Vh", binary],
                                      stdin=subprocess.PIPE,
                                      stdout=subprocess.PIPE,
                                      universal_newlines=True)
        # communicate() closes stdin, reads all of stdout and waits for the
        # child, so neither a zombie process nor an open pipe is left behind.
        otool_output = otool_pipe.communicate()[0]
        # Always record a result, so that the lookup below cannot raise
        # KeyError for a binary that is neither a DYLIB nor an EXECUTE.
        filetype = None
        for t in ["DYLIB", "EXECUTE"]:
            if t in otool_output:
                filetype = t
        filetypes[binary] = filetype
    return filetypes[binary]
def symbolize_atos(line):
    """Symbolize one report line with atos and print the result.

    A stack frame line looks like
        #0 0x7f6e35cf2e45 (/blah/foo.so+0x11fe45)
    For such a line a fresh `atos` process is started for the binary.  For a
    DYLIB (see get_macho_filetype) the module offset is looked up against
    load address 0x0; otherwise the address adjusted by patch_address is
    looked up against the load address computed as address minus offset.
    The frame is printed as '<prefix><address> in <function> <file:line>'
    when atos answers in its usual format, and as
    '<prefix><address> in <raw atos answer>' otherwise.  Any line that is
    not a stack frame is printed back with trailing whitespace stripped.

    Args:
      line: one line of the report, usually ending with a newline.
    """
    match = re.match(
        r'^( *#([0-9]+) *)(0x[0-9a-f]+) *\((.*)\+(0x[0-9a-f]+)\)', line)
    if not match:
        print(line.rstrip())
        return
    prefix, frameno, orig_addr, binary, offset = match.groups()
    addr = patch_address(frameno, orig_addr)
    filetype = get_macho_filetype(binary)

    # Guess which arch we're running. 10 = len("0x") + 8 hex digits.
    # The address as captured from the report is measured, not the patched
    # one: the patched text may be one digit shorter after the decrement
    # (0x100000000 -> 0xffffffff) or carry formatting artifacts.
    arch = "x86_64" if len(orig_addr) > 10 else "i386"

    if filetype == "DYLIB":
        load_addr = "0x0"
        query = offset
    else:
        # '0x%x' rather than hex(): Python 2's hex() appends 'L' to longs.
        load_addr = "0x%x" % (int(orig_addr, 16) - int(offset, 16))
        query = addr
    if DEBUG:
        print("atos -o %s -arch %s -l %s" % (binary, arch, load_addr))
    cmd = ["atos", "-o", binary, "-arch", arch, "-l", load_addr]
    p = subprocess.Popen(cmd,
                         stdin=subprocess.PIPE,
                         stdout=subprocess.PIPE,
                         stderr=subprocess.PIPE,
                         universal_newlines=True)
    # TODO(glider): it's more efficient to make a batch atos run for each
    # binary.
    # communicate() sends the query, closes stdin, drains both output pipes
    # and waits for atos, so no process or descriptor leaks per frame.
    atos_output = p.communicate(query + "\n")[0]
    # Only the first line of the answer is used.
    atos_line = atos_output.split("\n", 1)[0].rstrip()

    # A well-formed atos response looks like this:
    #   foo(type1, type2) (in object.name) (filename.cc:80)
    response = re.match(r'^(.*) \(in (.*)\) \((.*:\d*)\)$', atos_line)
    if response:
        # Drop the parenthesized argument list from the function name.
        function_name = re.sub(r"\(.*?\)", "", response.group(1))
        file_name = fix_filename(response.group(3))
        print("%s%s in %s %s" % (prefix, addr, function_name, file_name))
    else:
        print("%s%s in %s" % (prefix, addr, atos_line))
# Script driver: choose the symbolizer that matches the host OS once, then
# feed every line of standard input through it.
system = os.uname()[0]
symbolizers = {'Linux': symbolize_addr2line, 'Darwin': symbolize_atos}
if system in symbolizers:
    symbolize = symbolizers[system]
    for line in sys.stdin:
        symbolize(line)
else:
    # Joined with a single space, matching the separator a two-item print
    # statement inserts between its items.
    print(' '.join(['Unknown system: ', system]))