#!/usr/bin/env python #===- lib/asan/scripts/asan_symbolize.py -----------------------------------===# # # The LLVM Compiler Infrastructure # # This file is distributed under the University of Illinois Open Source # License. See LICENSE.TXT for details. # #===------------------------------------------------------------------------===# import glob import os import re import sys import string import subprocess pipes = {} load_addresses = {} next_inline_frameno = 0 def patch_address(frameno, addr_s): ''' Subtracts 1 or 2 from the top frame's address. Top frame is normally the return address from asan_report* call, which is not expected to return at all. Because of that, this address often belongs to the next source code line, or even to a different function. ''' if frameno == '0': addr = int(addr_s, 16) if os.uname()[4].startswith('arm'): # Cancel the Thumb bit addr = addr & (~1) addr -= 1 return hex(addr) return addr_s def android_get_load_address(path): if load_addresses.has_key(path): return load_addresses[path] readelf_glob = os.path.join(os.environ['ANDROID_TOOLCHAIN'], '*-readelf') readelf = glob.glob(readelf_glob)[0] readelf_pipe = subprocess.Popen([readelf, "-l", path], stdin=subprocess.PIPE, stdout=subprocess.PIPE) for line in readelf_pipe.stdout: if ('LOAD' in line) and (' E ' in line): match = re.match(r'\s*LOAD\s+0x[01-9a-zA-Z]+\s+(0x[01-9a-zA-Z]+)', line, re.UNICODE) if match: load_addr = int(match.group(1), 16) load_addresses[path] = load_addr return load_addr else: break print 'Could not make sense of readelf output!' sys.exit(1) def postprocess_file_name(file_name, paths_to_cut): for path_to_cut in paths_to_cut: file_name = re.sub(".*" + path_to_cut, "", file_name) file_name = re.sub(".*asan_[a-z_]*.(cc|h):[0-9]*", "[asan_rtl]", file_name) file_name = re.sub(".*crtstuff.c:0", "???:0", file_name) return file_name # TODO(glider): need some refactoring here def symbolize_addr2line(line, binary_prefix, paths_to_cut): global next_inline_frameno # Strip the log prefix ("I/asanwrapper( 1196): "). line = re.sub(r'^.*?: ', '', line) #0 0x7f6e35cf2e45 (/blah/foo.so+0x11fe45) match = re.match(r'^(\s*#)([0-9]+) *(0x[0-9a-f]+) *\((.*)\+(0x[0-9a-f]+)\)', line, re.UNICODE) if match: frameno = match.group(2) binary = match.group(4) addr = match.group(5) addr = patch_address(frameno, addr) if binary.startswith('/'): binary = binary[1:] binary = os.path.join(binary_prefix, binary) if not os.path.exists(binary): print line.rstrip().encode('utf-8') return load_addr = android_get_load_address(binary) addr = hex(int(addr, 16) + load_addr) if not pipes.has_key(binary): pipes[binary] = subprocess.Popen(["addr2line", "-i", "-f", "-e", binary], stdin=subprocess.PIPE, stdout=subprocess.PIPE) p = pipes[binary] frames = [] try: print >>p.stdin, addr # This will trigger a "??" response from addr2line so we know when to stop print >>p.stdin while True: function_name = p.stdout.readline().rstrip() file_name = p.stdout.readline().rstrip() if function_name in ['??', '']: break file_name = postprocess_file_name(file_name, paths_to_cut) frames.append((function_name, file_name)) except: pass if not frames: frames.append(('', '')) # Consume another pair of "??" lines try: p.stdout.readline() p.stdout.readline() except: pass for frame in frames: inline_frameno = next_inline_frameno next_inline_frameno += 1 print "%s%d" % (match.group(1).encode('utf-8'), inline_frameno), \ match.group(3).encode('utf-8'), "in", frame[0], frame[1] else: print line.rstrip().encode('utf-8') binary_prefix = os.path.join(os.environ['ANDROID_PRODUCT_OUT'], 'symbols') paths_to_cut = [os.getcwd() + '/', os.environ['ANDROID_BUILD_TOP'] + '/'] + sys.argv[1:] for line in sys.stdin: line = line.decode('utf-8') symbolize_addr2line(line, binary_prefix, paths_to_cut)