#!/usr/bin/env python
#
# Copyright (C) 2015 The Android Open Source Project
#
# Licensed under the Apache License, Version 2.0 (the "License");
# you may not use this file except in compliance with the License.
# You may obtain a copy of the License at
#
# http://www.apache.org/licenses/LICENSE-2.0
#
# Unless required by applicable law or agreed to in writing, software
# distributed under the License is distributed on an "AS IS" BASIS,
# WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
# See the License for the specific language governing permissions and
# limitations under the License.
#
"""Simpleperf runtest runner: run simpleperf runtests on host or on device.
For a simpleperf runtest like one_function test, it contains following steps:
1. Run simpleperf record command to record simpleperf_runtest_one_function's
running samples, which is generated in perf.data.
2. Run simpleperf report command to parse perf.data, generate perf.report.
4. Parse perf.report and see if it matches expectation.
The information of all runtests is stored in runtest.conf.
"""
import os
import os.path
import re
import subprocess
import sys
import xml.etree.ElementTree as ET
class CallTreeNode(object):
def __init__(self, name):
self.name = name
self.children = []
def add_child(self, child):
self.children.append(child)
def __str__(self):
return 'CallTreeNode:\n' + '\n'.join(self._dump(1))
def _dump(self, indent):
indent_str = ' ' * indent
strs = [indent_str + self.name]
for child in self.children:
strs.extend(child._dump(indent + 1))
return strs
class Symbol(object):
def __init__(self, name, comm, overhead, children_overhead):
self.name = name
self.comm = comm
self.overhead = overhead
# children_overhead is the overhead sum of this symbol and functions
# called by this symbol.
self.children_overhead = children_overhead
self.call_tree = None
def set_call_tree(self, call_tree):
self.call_tree = call_tree
def __str__(self):
strs = []
strs.append('Symbol name=%s comm=%s overhead=%f children_overhead=%f' % (
self.name, self.comm, self.overhead, self.children_overhead))
if self.call_tree:
strs.append('\t%s' % self.call_tree)
return '\n'.join(strs)
class SymbolOverheadRequirement(object):
def __init__(self, symbol_name=None, comm=None, min_overhead=None,
max_overhead=None):
self.symbol_name = symbol_name
self.comm = comm
self.min_overhead = min_overhead
self.max_overhead = max_overhead
def __str__(self):
strs = []
strs.append('SymbolOverheadRequirement')
if self.symbol_name is not None:
strs.append('symbol_name=%s' % self.symbol_name)
if self.comm is not None:
strs.append('comm=%s' % self.comm)
if self.min_overhead is not None:
strs.append('min_overhead=%f' % self.min_overhead)
if self.max_overhead is not None:
strs.append('max_overhead=%f' % self.max_overhead)
return ' '.join(strs)
def is_match(self, symbol):
if self.symbol_name is not None:
if self.symbol_name != symbol.name:
return False
if self.comm is not None:
if self.comm != symbol.comm:
return False
return True
def check_overhead(self, overhead):
if self.min_overhead is not None:
if self.min_overhead > overhead:
return False
if self.max_overhead is not None:
if self.max_overhead < overhead:
return False
return True
class SymbolRelationRequirement(object):
def __init__(self, symbol_name, comm=None):
self.symbol_name = symbol_name
self.comm = comm
self.children = []
def add_child(self, child):
self.children.append(child)
def __str__(self):
return 'SymbolRelationRequirement:\n' + '\n'.join(self._dump(1))
def _dump(self, indent):
indent_str = ' ' * indent
strs = [indent_str + self.symbol_name +
(' ' + self.comm if self.comm else '')]
for child in self.children:
strs.extend(child._dump(indent + 1))
return strs
def is_match(self, symbol):
if symbol.name != self.symbol_name:
return False
if self.comm is not None:
if symbol.comm != self.comm:
return False
return True
def check_relation(self, call_tree):
if not call_tree:
return False
if self.symbol_name != call_tree.name:
return False
for child in self.children:
child_matched = False
for node in call_tree.children:
if child.check_relation(node):
child_matched = True
break
if not child_matched:
return False
return True
class Test(object):
def __init__(
self,
test_name,
executable_name,
report_options,
symbol_overhead_requirements,
symbol_children_overhead_requirements,
symbol_relation_requirements):
self.test_name = test_name
self.executable_name = executable_name
self.report_options = report_options
self.symbol_overhead_requirements = symbol_overhead_requirements
self.symbol_children_overhead_requirements = (
symbol_children_overhead_requirements)
self.symbol_relation_requirements = symbol_relation_requirements
def __str__(self):
strs = []
strs.append('Test test_name=%s' % self.test_name)
strs.append('\texecutable_name=%s' % self.executable_name)
strs.append('\treport_options=%s' % (' '.join(self.report_options)))
strs.append('\tsymbol_overhead_requirements:')
for req in self.symbol_overhead_requirements:
strs.append('\t\t%s' % req)
strs.append('\tsymbol_children_overhead_requirements:')
for req in self.symbol_children_overhead_requirements:
strs.append('\t\t%s' % req)
strs.append('\tsymbol_relation_requirements:')
for req in self.symbol_relation_requirements:
strs.append('\t\t%s' % req)
return '\n'.join(strs)
def load_config_file(config_file):
tests = []
tree = ET.parse(config_file)
root = tree.getroot()
assert root.tag == 'runtests'
for test in root:
assert test.tag == 'test'
test_name = test.attrib['name']
executable_name = None
report_options = []
symbol_overhead_requirements = []
symbol_children_overhead_requirements = []
symbol_relation_requirements = []
for test_item in test:
if test_item.tag == 'executable':
executable_name = test_item.attrib['name']
elif test_item.tag == 'report':
report_options = test_item.attrib['option'].split()
elif (test_item.tag == 'symbol_overhead' or
test_item.tag == 'symbol_children_overhead'):
for symbol_item in test_item:
assert symbol_item.tag == 'symbol'
symbol_name = None
if 'name' in symbol_item.attrib:
symbol_name = symbol_item.attrib['name']
comm = None
if 'comm' in symbol_item.attrib:
comm = symbol_item.attrib['comm']
overhead_min = None
if 'min' in symbol_item.attrib:
overhead_min = float(symbol_item.attrib['min'])
overhead_max = None
if 'max' in symbol_item.attrib:
overhead_max = float(symbol_item.attrib['max'])
if test_item.tag == 'symbol_overhead':
symbol_overhead_requirements.append(
SymbolOverheadRequirement(
symbol_name,
comm,
overhead_min,
overhead_max)
)
else:
symbol_children_overhead_requirements.append(
SymbolOverheadRequirement(
symbol_name,
comm,
overhead_min,
overhead_max))
elif test_item.tag == 'symbol_callgraph_relation':
for symbol_item in test_item:
req = load_symbol_relation_requirement(symbol_item)
symbol_relation_requirements.append(req)
tests.append(
Test(
test_name,
executable_name,
report_options,
symbol_overhead_requirements,
symbol_children_overhead_requirements,
symbol_relation_requirements))
return tests
def load_symbol_relation_requirement(symbol_item):
symbol_name = symbol_item.attrib['name']
comm = None
if 'comm' in symbol_item.attrib:
comm = symbol_item.attrib['comm']
req = SymbolRelationRequirement(symbol_name, comm)
for item in symbol_item:
child_req = load_symbol_relation_requirement(item)
req.add_child(child_req)
return req
class Runner(object):
def __init__(self, target, perf_path):
self.target = target
self.is32 = target.endswith('32')
self.perf_path = perf_path
self.use_callgraph = False
self.sampler = 'cpu-cycles'
def record(self, test_executable_name, record_file, additional_options=[]):
call_args = [self.perf_path, 'record']
call_args += ['--duration', '2']
call_args += ['-e', '%s:u' % self.sampler]
if self.use_callgraph:
call_args += ['-f', '1000', '-g']
call_args += ['-o', record_file]
call_args += additional_options
test_executable_name += '32' if self.is32 else '64'
call_args += [test_executable_name]
self._call(call_args)
def report(self, record_file, report_file, additional_options=[]):
call_args = [self.perf_path, 'report']
call_args += ['-i', record_file]
if self.use_callgraph:
call_args += ['-g', 'callee']
call_args += additional_options
self._call(call_args, report_file)
def _call(self, args, output_file=None):
pass
class HostRunner(Runner):
"""Run perf test on host."""
def __init__(self, target):
perf_path = 'simpleperf32' if target.endswith('32') else 'simpleperf'
super(HostRunner, self).__init__(target, perf_path)
def _call(self, args, output_file=None):
output_fh = None
if output_file is not None:
output_fh = open(output_file, 'w')
subprocess.check_call(args, stdout=output_fh)
if output_fh is not None:
output_fh.close()
class DeviceRunner(Runner):
"""Run perf test on device."""
def __init__(self, target):
self.tmpdir = '/data/local/tmp/'
perf_path = 'simpleperf32' if target.endswith('32') else 'simpleperf'
super(DeviceRunner, self).__init__(target, self.tmpdir + perf_path)
self._download(os.environ['OUT'] + '/system/xbin/' + perf_path, self.tmpdir)
lib = 'lib' if self.is32 else 'lib64'
self._download(os.environ['OUT'] + '/system/' + lib + '/libsimpleperf_inplace_sampler.so',
self.tmpdir)
def _call(self, args, output_file=None):
output_fh = None
if output_file is not None:
output_fh = open(output_file, 'w')
args_with_adb = ['adb', 'shell']
args_with_adb.append('export LD_LIBRARY_PATH=' + self.tmpdir + ' && ' + ' '.join(args))
subprocess.check_call(args_with_adb, stdout=output_fh)
if output_fh is not None:
output_fh.close()
def _download(self, file, to_dir):
args = ['adb', 'push', file, to_dir]
subprocess.check_call(args)
def record(self, test_executable_name, record_file, additional_options=[]):
self._download(os.environ['OUT'] + '/system/bin/' + test_executable_name +
('32' if self.is32 else '64'), self.tmpdir)
super(DeviceRunner, self).record(self.tmpdir + test_executable_name,
self.tmpdir + record_file,
additional_options)
def report(self, record_file, report_file, additional_options=[]):
super(DeviceRunner, self).report(self.tmpdir + record_file,
report_file,
additional_options)
class ReportAnalyzer(object):
"""Check if perf.report matches expectation in Configuration."""
def _read_report_file(self, report_file, has_callgraph):
fh = open(report_file, 'r')
lines = fh.readlines()
fh.close()
lines = [x.rstrip() for x in lines]
blank_line_index = -1
for i in range(len(lines)):
if not lines[i]:
blank_line_index = i
assert blank_line_index != -1
assert blank_line_index + 1 < len(lines)
title_line = lines[blank_line_index + 1]
report_item_lines = lines[blank_line_index + 2:]
if has_callgraph:
assert re.search(r'^Children\s+Self\s+Command.+Symbol$', title_line)
else:
assert re.search(r'^Overhead\s+Command.+Symbol$', title_line)
return self._parse_report_items(report_item_lines, has_callgraph)
def _parse_report_items(self, lines, has_callgraph):
symbols = []
cur_symbol = None
call_tree_stack = {}
vertical_columns = []
last_node = None
last_depth = -1
for line in lines:
if not line:
continue
if not line[0].isspace():
if has_callgraph:
m = re.search(r'^([\d\.]+)%\s+([\d\.]+)%\s+(\S+).*\s+(\S+)$', line)
children_overhead = float(m.group(1))
overhead = float(m.group(2))
comm = m.group(3)
symbol_name = m.group(4)
cur_symbol = Symbol(symbol_name, comm, overhead, children_overhead)
symbols.append(cur_symbol)
else:
m = re.search(r'^([\d\.]+)%\s+(\S+).*\s+(\S+)$', line)
overhead = float(m.group(1))
comm = m.group(2)
symbol_name = m.group(3)
cur_symbol = Symbol(symbol_name, comm, overhead, 0)
symbols.append(cur_symbol)
# Each report item can have different column depths.
vertical_columns = []
else:
for i in range(len(line)):
if line[i] == '|':
if not vertical_columns or vertical_columns[-1] < i:
vertical_columns.append(i)
if not line.strip('| \t'):
continue
if line.find('-') == -1:
function_name = line.strip('| \t')
node = CallTreeNode(function_name)
last_node.add_child(node)
last_node = node
call_tree_stack[last_depth] = node
else:
pos = line.find('-')
depth = -1
for i in range(len(vertical_columns)):
if pos >= vertical_columns[i]:
depth = i
assert depth != -1
line = line.strip('|- \t')
m = re.search(r'^[\d\.]+%[-\s]+(.+)$', line)
if m:
function_name = m.group(1)
else:
function_name = line
node = CallTreeNode(function_name)
if depth == 0:
cur_symbol.set_call_tree(node)
else:
call_tree_stack[depth - 1].add_child(node)
call_tree_stack[depth] = node
last_node = node
last_depth = depth
return symbols
def check_report_file(self, test, report_file, has_callgraph):
symbols = self._read_report_file(report_file, has_callgraph)
if not self._check_symbol_overhead_requirements(test, symbols):
return False
if has_callgraph:
if not self._check_symbol_children_overhead_requirements(test, symbols):
return False
if not self._check_symbol_relation_requirements(test, symbols):
return False
return True
def _check_symbol_overhead_requirements(self, test, symbols):
result = True
matched = [False] * len(test.symbol_overhead_requirements)
matched_overhead = [0] * len(test.symbol_overhead_requirements)
for symbol in symbols:
for i in range(len(test.symbol_overhead_requirements)):
req = test.symbol_overhead_requirements[i]
if req.is_match(symbol):
matched[i] = True
matched_overhead[i] += symbol.overhead
for i in range(len(matched)):
if not matched[i]:
print 'requirement (%s) has no matched symbol in test %s' % (
test.symbol_overhead_requirements[i], test)
result = False
else:
fulfilled = req.check_overhead(matched_overhead[i])
if not fulfilled:
print "Symbol (%s) doesn't match requirement (%s) in test %s" % (
symbol, req, test)
result = False
return result
def _check_symbol_children_overhead_requirements(self, test, symbols):
result = True
matched = [False] * len(test.symbol_children_overhead_requirements)
for symbol in symbols:
for i in range(len(test.symbol_children_overhead_requirements)):
req = test.symbol_children_overhead_requirements[i]
if req.is_match(symbol):
matched[i] = True
fulfilled = req.check_overhead(symbol.children_overhead)
if not fulfilled:
print "Symbol (%s) doesn't match requirement (%s) in test %s" % (
symbol, req, test)
result = False
for i in range(len(matched)):
if not matched[i]:
print 'requirement (%s) has no matched symbol in test %s' % (
test.symbol_children_overhead_requirements[i], test)
result = False
return result
def _check_symbol_relation_requirements(self, test, symbols):
result = True
matched = [False] * len(test.symbol_relation_requirements)
for symbol in symbols:
for i in range(len(test.symbol_relation_requirements)):
req = test.symbol_relation_requirements[i]
if req.is_match(symbol):
matched[i] = True
fulfilled = req.check_relation(symbol.call_tree)
if not fulfilled:
print "Symbol (%s) doesn't match requirement (%s) in test %s" % (
symbol, req, test)
result = False
for i in range(len(matched)):
if not matched[i]:
print 'requirement (%s) has no matched symbol in test %s' % (
test.symbol_relation_requirements[i], test)
result = False
return result
def build_runner(target, use_callgraph, sampler):
if target == 'host32' and use_callgraph:
print "Current 64bit linux host doesn't support `simpleperf32 record -g`"
return None
if target.startswith('host'):
runner = HostRunner(target)
else:
runner = DeviceRunner(target)
runner.use_callgraph = use_callgraph
runner.sampler = sampler
return runner
def test_with_runner(runner, tests):
report_analyzer = ReportAnalyzer()
for test in tests:
runner.record(test.executable_name, 'perf.data')
if runner.sampler == 'inplace-sampler':
# TODO: fix this when inplace-sampler actually works.
runner.report('perf.data', 'perf.report')
symbols = report_analyzer._read_report_file('perf.report', runner.use_callgraph)
result = False
if len(symbols) == 1 and symbols[0].name.find('FakeFunction()') != -1:
result = True
else:
runner.report('perf.data', 'perf.report', additional_options = test.report_options)
result = report_analyzer.check_report_file(test, 'perf.report', runner.use_callgraph)
str = 'test %s on %s ' % (test.test_name, runner.target)
if runner.use_callgraph:
str += 'with call graph '
str += 'using %s ' % runner.sampler
str += ' Succeeded' if result else 'Failed'
print str
if not result:
exit(1)
def runtest(target_options, use_callgraph_options, sampler_options, selected_tests):
tests = load_config_file(os.path.dirname(os.path.realpath(__file__)) + \
'/runtest.conf')
if selected_tests is not None:
new_tests = []
for test in tests:
if test.test_name in selected_tests:
new_tests.append(test)
tests = new_tests
for target in target_options:
for use_callgraph in use_callgraph_options:
for sampler in sampler_options:
runner = build_runner(target, use_callgraph, sampler)
if runner is not None:
test_with_runner(runner, tests)
def main():
target_options = ['host64', 'host32', 'device64', 'device32']
use_callgraph_options = [False, True]
sampler_options = ['cpu-cycles', 'inplace-sampler']
selected_tests = None
i = 1
while i < len(sys.argv):
if sys.argv[i] == '--host':
target_options = ['host64', 'host32']
elif sys.argv[i] == '--device':
target_options = ['device64', 'device32']
elif sys.argv[i] == '--normal':
use_callgraph_options = [False]
elif sys.argv[i] == '--callgraph':
use_callgraph_options = [True]
elif sys.argv[i] == '--no-inplace-sampler':
sampler_options = ['cpu-cycles']
elif sys.argv[i] == '--inplace-sampler':
sampler_options = ['inplace-sampler']
elif sys.argv[i] == '--test':
if i < len(sys.argv):
i += 1
for test in sys.argv[i].split(','):
if selected_tests is None:
selected_tests = {}
selected_tests[test] = True
i += 1
runtest(target_options, use_callgraph_options, sampler_options, selected_tests)
if __name__ == '__main__':
main()