# Copyright (c) 2013 The Chromium OS Authors. All rights reserved.
# Use of this source code is governed by a BSD-style license that can be
# found in the LICENSE file.
"""A module to handle the report format."""

from __future__ import print_function

import datetime
import functools
import itertools
import json
import os
import re

from cros_utils.tabulator import AmeanResult
from cros_utils.tabulator import Cell
from cros_utils.tabulator import CoeffVarFormat
from cros_utils.tabulator import CoeffVarResult
from cros_utils.tabulator import Column
from cros_utils.tabulator import Format
from cros_utils.tabulator import GmeanRatioResult
from cros_utils.tabulator import LiteralResult
from cros_utils.tabulator import MaxResult
from cros_utils.tabulator import MinResult
from cros_utils.tabulator import PValueFormat
from cros_utils.tabulator import PValueResult
from cros_utils.tabulator import RatioFormat
from cros_utils.tabulator import RawResult
from cros_utils.tabulator import StdResult
from cros_utils.tabulator import TableFormatter
from cros_utils.tabulator import TableGenerator
from cros_utils.tabulator import TablePrinter
from update_telemetry_defaults import TelemetryDefaults

from column_chart import ColumnChart
from results_organizer import OrganizeResults

import results_report_templates as templates

# `basestring` only exists on Python 2; fall back to `str` on Python 3 so that
# the string check in ParseStandardPerfReport works on both.
try:
    _STRING_TYPES = (basestring,)  # pylint: disable=undefined-variable
except NameError:
    _STRING_TYPES = (str,)


def ParseChromeosImage(chromeos_image):
    """Parse the chromeos_image string for the image and version.

    The chromeos_image string will probably be in one of two formats:
    1: <path-to-chroot>/src/build/images/<board>/<ChromeOS-version>.<datetime>/ \
       chromiumos_test_image.bin
    2: <path-to-chroot>/chroot/tmp/<buildbot-build>/<ChromeOS-version>/ \
        chromiumos_test_image.bin

    We parse these strings to find the 'chromeos_version' to store in the
    json archive (without the .datetime bit in the first case); and also
    the 'chromeos_image', which would be all of the first case, but only the
    part after '/chroot/tmp' in the second case.

    Args:
      chromeos_image: string containing the path to the chromeos_image that
        crosperf used for the test.

    Returns:
      version, image: The results of parsing the input string, as explained
        above. `version` is '' when the path does not end in
        '/chromiumos_test_image.bin'.
    """
    # Find the Chromeos Version, e.g. R45-2345.0.0.....
    # chromeos_image should have been something like:
    # <path>/<board-trybot-release>/<chromeos-version>/chromiumos_test_image.bin"
    if chromeos_image.endswith('/chromiumos_test_image.bin'):
        full_version = chromeos_image.split('/')[-2]
        # Strip the date and time off of local builds (which have the format
        # "R43-2345.0.0.date-and-time").
        # NOTE: splitext() drops whatever follows the last '.', whether or not
        # it is actually a date-and-time suffix.
        version, _ = os.path.splitext(full_version)
    else:
        version = ''

    # Find the chromeos image.  If it's somewhere in .../chroot/tmp/..., then
    # it's an official image that got downloaded, so chop off the download path
    # to make the official image name more clear.
    official_image_path = '/chroot/tmp'
    if official_image_path in chromeos_image:
        image = chromeos_image.split(official_image_path, 1)[1]
    else:
        image = chromeos_image
    return version, image


def _AppendUntilLengthIs(gen, the_list, target_len):
    """Appends to `the_list` until it is `target_len` elements long.

    Uses `gen` (a zero-argument callable) to generate each new element. A list
    that is already at least `target_len` long is left untouched.

    Returns:
      `the_list` itself, which is modified in place.
    """
    the_list.extend(gen() for _ in range(target_len - len(the_list)))
    return the_list


def _FilterPerfReport(event_threshold, report):
    """Filters out entries with `< event_threshold` percent in a perf report.

    Args:
      event_threshold: minimum percentage a function needs in order to be kept.
      report: dict of {event_name: {function_name: percentage}}.

    Returns:
      A new dict with the same events, each holding only the functions whose
      percentage is `>= event_threshold`. `report` is not modified.
    """

    def filter_dict(m):
        return {
            fn_name: pct
            for fn_name, pct in m.items() if pct >= event_threshold
        }

    return {event: filter_dict(m) for event, m in report.items()}


class _PerfTable(object):
    """Generates dicts from a perf table.

    Dicts look like:
    {'benchmark_name': {'perf_event_name': [LabelData]}}
    where LabelData is a list of perf dicts, each perf dict coming from the same
    label.
    Each perf dict looks like {'function_name': 0.10, ...} (where 0.10 is the
    percentage of time spent in function_name).
    """

    def __init__(self,
                 benchmark_names_and_iterations,
                 label_names,
                 read_perf_report,
                 event_threshold=None):
        """Constructor.

        read_perf_report is a function that takes a label name, benchmark name,
        and benchmark iteration, and returns a dictionary describing the perf
        output for that given run.

        Args:
          benchmark_names_and_iterations: iterable of (benchmark_name,
            iteration_count) pairs.
          label_names: list of label names; a label's position in this list is
            its index in each LabelData list.
          read_perf_report: see above.
          event_threshold: if not None, functions below this percentage are
            dropped from every report (see _FilterPerfReport).
        """
        self.event_threshold = event_threshold
        self._label_indices = {name: i for i, name in enumerate(label_names)}
        self.perf_data = {}
        for label in label_names:
            for bench_name, bench_iterations in benchmark_names_and_iterations:
                for i in range(bench_iterations):
                    report = read_perf_report(label, bench_name, i)
                    self._ProcessPerfReport(report, label, bench_name, i)

    def _ProcessPerfReport(self, perf_report, label, benchmark_name, iteration):
        """Add the data from one run to the dict."""
        perf_of_run = perf_report
        if self.event_threshold is not None:
            perf_of_run = _FilterPerfReport(self.event_threshold, perf_report)
        # The set of events tracked for a benchmark is fixed by the first
        # report that is processed for it.
        if benchmark_name not in self.perf_data:
            self.perf_data[benchmark_name] = {
                event: [] for event in perf_of_run
            }
        ben_data = self.perf_data[benchmark_name]
        label_index = self._label_indices[label]
        for event in ben_data:
            _AppendUntilLengthIs(list, ben_data[event], label_index + 1)
            data_for_label = ben_data[event][label_index]
            _AppendUntilLengthIs(dict, data_for_label, iteration + 1)
            # A run that has no report at all, or whose report lacks this
            # particular event, contributes an empty perf dict instead of
            # raising KeyError.
            if perf_of_run:
                data_for_label[iteration] = perf_of_run.get(event, {})
            else:
                data_for_label[iteration] = {}


def _GetResultsTableHeader(ben_name, iterations):
    """Builds a one-cell header table naming the benchmark and iterations."""
    benchmark_info = ('Benchmark:  {0};  Iterations: {1}'.format(
        ben_name, iterations))
    cell = Cell()
    cell.string_value = benchmark_info
    cell.header = True
    return [[cell]]


def _ParseColumn(columns, iteration):
    """Expands every RawResult column into one literal column per iteration.

    Columns whose result class is not named 'RawResult' are passed through
    unchanged; each RawResult column is replaced by `iteration` columns that
    are titled '1', '2', ... and wrap LiteralResult(0), LiteralResult(1), ...

    Returns:
      A new list of columns; `columns` is not modified.
    """
    new_column = []
    for column in columns:
        if column.result.__class__.__name__ != 'RawResult':
            new_column.append(column)
        else:
            new_column.extend(
                Column(LiteralResult(i), Format(), str(i + 1))
                for i in range(iteration))
    return new_column


def _GetTables(benchmark_results, columns, table_type):
    """Builds the header and result cell tables for every benchmark.

    Returns:
      A flat list that holds, for each benchmark in
      `benchmark_results.run_keyvals`, a header table followed by either the
      formatted results table or a one-cell "no result" table.
    """
    iter_counts = benchmark_results.iter_counts
    result = benchmark_results.run_keyvals
    tables = []
    for bench_name, runs in result.items():
        iterations = iter_counts[bench_name]
        ben_table = _GetResultsTableHeader(bench_name, iterations)

        # `runs` is indexed by label, then by iteration; every entry being
        # empty means that nothing was collected for this benchmark.
        all_runs_empty = all(not run for label in runs for run in label)
        if all_runs_empty:
            cell = Cell()
            cell.string_value = ('This benchmark contains no result.'
                                 ' Is the benchmark name valid?')
            cell_table = [[cell]]
        else:
            table = TableGenerator(runs,
                                   benchmark_results.label_names).GetTable()
            parsed_columns = _ParseColumn(columns, iterations)
            tf = TableFormatter(table, parsed_columns)
            cell_table = tf.GetCellTable(table_type)
        tables.append(ben_table)
        tables.append(cell_table)
    return tables


def _GetPerfTables(benchmark_results, columns, table_type):
    """Builds the header and per-event perf cell tables for every benchmark.

    Returns:
      A flat list that holds, for each benchmark with perf data, a header
      table followed by one cell table per perf event.
    """
    p_table = _PerfTable(benchmark_results.benchmark_names_and_iterations,
                         benchmark_results.label_names,
                         benchmark_results.read_perf_report)

    tables = []
    for benchmark in p_table.perf_data:
        iterations = benchmark_results.iter_counts[benchmark]
        ben_table = _GetResultsTableHeader(benchmark, iterations)
        tables.append(ben_table)
        benchmark_data = p_table.perf_data[benchmark]
        for event in benchmark_data:
            tg = TableGenerator(
                benchmark_data[event],
                benchmark_results.label_names,
                sort=TableGenerator.SORT_BY_VALUES_DESC)
            table = tg.GetTable(ResultsReport.PERF_ROWS)
            parsed_columns = _ParseColumn(columns, iterations)
            tf = TableFormatter(table, parsed_columns)
            tf.GenerateCellTable(table_type)
            tf.AddColumnName()
            tf.AddLabelName()
            tf.AddHeader(str(event))
            table = tf.GetCellTable(table_type, headers=False)
            tables.append(table)
    return tables


class ResultsReport(object):
    """Class to handle the report format."""
    MAX_COLOR_CODE = 255
    # Passed to TableGenerator.GetTable() when building perf tables.
    PERF_ROWS = 5

    def __init__(self, results):
        self.benchmark_results = results

    def _GetTablesWithColumns(self, columns, table_type, perf):
        """Builds either the perf tables or the regular result tables."""
        get_tables = _GetPerfTables if perf else _GetTables
        return get_tables(self.benchmark_results, columns, table_type)

    def GetFullTables(self, perf=False):
        """Returns the 'full' tables: raw per-iteration values plus stats."""
        columns = [
            Column(RawResult(), Format()),
            Column(MinResult(), Format()),
            Column(MaxResult(), Format()),
            Column(AmeanResult(), Format()),
            Column(StdResult(), Format(), 'StdDev'),
            Column(CoeffVarResult(), CoeffVarFormat(), 'StdDev/Mean'),
            Column(GmeanRatioResult(), RatioFormat(), 'GmeanSpeedup'),
            Column(PValueResult(), PValueFormat(), 'p-value'),
        ]
        return self._GetTablesWithColumns(columns, 'full', perf)

    def GetSummaryTables(self, perf=False):
        """Returns the 'summary' tables: aggregate statistics only."""
        columns = [
            Column(AmeanResult(), Format()),
            Column(StdResult(), Format(), 'StdDev'),
            Column(CoeffVarResult(), CoeffVarFormat(), 'StdDev/Mean'),
            Column(GmeanRatioResult(), RatioFormat(), 'GmeanSpeedup'),
            Column(PValueResult(), PValueFormat(), 'p-value'),
        ]
        return self._GetTablesWithColumns(columns, 'summary', perf)


def _PrintTable(tables, out_to):
    """Renders `tables` as one string in the format named by `out_to`.

    Args:
      tables: list of cell tables; may be None or empty.
      out_to: one of 'HTML', 'PLAIN', 'CONSOLE', 'TSV' or 'EMAIL'.

    Returns:
      The concatenated output of every table's printer, or '' when there are
      no tables.

    Raises:
      ValueError: if `out_to` is not one of the supported names (only checked
        when `tables` is non-empty).
    """
    # tables may be None.
    if not tables:
        return ''

    if out_to == 'HTML':
        out_type = TablePrinter.HTML
    elif out_to == 'PLAIN':
        out_type = TablePrinter.PLAIN
    elif out_to == 'CONSOLE':
        out_type = TablePrinter.CONSOLE
    elif out_to == 'TSV':
        out_type = TablePrinter.TSV
    elif out_to == 'EMAIL':
        out_type = TablePrinter.EMAIL
    else:
        raise ValueError('Invalid out_to value: %s' % (out_to,))

    printers = (TablePrinter(table, out_type) for table in tables)
    return ''.join(printer.Print() for printer in printers)


class TextResultsReport(ResultsReport):
    """Class to generate text result report."""

    H1_STR = '==========================================='
    H2_STR = '-------------------------------------------'

    def __init__(self, results, email=False, experiment=None):
        super(TextResultsReport, self).__init__(results)
        self.email = email
        self.experiment = experiment

    @staticmethod
    def _MakeTitle(title):
        """Wraps `title` between two H1 rules, ending with one newline."""
        header_line = TextResultsReport.H1_STR
        # '' at the end gives one newline.
        return '\n'.join([header_line, title, header_line, ''])

    @staticmethod
    def _MakeSection(title, body):
        """Returns `title` between two H2 rules, followed by `body`."""
        header_line = TextResultsReport.H2_STR
        # '\n' at the end gives us two newlines.
        return '\n'.join([header_line, title, header_line, body, '\n'])

    @staticmethod
    def FromExperiment(experiment, email=False):
        """Builds a TextResultsReport from an experiment's results."""
        results = BenchmarkResults.FromExperiment(experiment)
        return TextResultsReport(results, email, experiment)

    def GetStatusTable(self):
        """Generate the status table by the tabulator.

        Reads `self.experiment.benchmark_runs`, so it must only be called when
        the report was constructed with an experiment.
        """
        table = [['', '']]
        columns = [
            Column(LiteralResult(iteration=0), Format(), 'Status'),
            Column(LiteralResult(iteration=1), Format(), 'Failing Reason'),
        ]

        for benchmark_run in self.experiment.benchmark_runs:
            status = [
                benchmark_run.name,
                [
                    benchmark_run.timeline.GetLastEvent(),
                    benchmark_run.failure_reason
                ]
            ]
            table.append(status)
        cell_table = TableFormatter(table, columns).GetCellTable('status')
        return [cell_table]

    def GetReport(self):
        """Generate the report for email and console."""
        output_type = 'EMAIL' if self.email else 'CONSOLE'
        experiment = self.experiment

        sections = []
        if experiment is not None:
            title_contents = "Results report for '%s'" % (experiment.name,)
        else:
            title_contents = 'Results report'
        sections.append(self._MakeTitle(title_contents))

        summary_table = _PrintTable(
            self.GetSummaryTables(perf=False), output_type)
        sections.append(self._MakeSection('Summary', summary_table))

        if experiment is not None:
            table = _PrintTable(self.GetStatusTable(), output_type)
            sections.append(self._MakeSection('Benchmark Run Status', table))

        # The perf section is left out entirely when there is no perf data.
        perf_table = _PrintTable(self.GetSummaryTables(perf=True), output_type)
        if perf_table:
            sections.append(self._MakeSection('Perf Data', perf_table))

        if experiment is not None:
            experiment_file = experiment.experiment_file
            sections.append(
                self._MakeSection('Experiment File', experiment_file))

            cpu_info = experiment.machine_manager.GetAllCPUInfo(
                experiment.labels)
            sections.append(self._MakeSection('CPUInfo', cpu_info))

        return '\n'.join(sections)


def _GetHTMLCharts(label_names, test_results):
    """Builds one ColumnChart per result row that holds numeric data.

    Args:
      label_names: list of label names; each one becomes a row in every chart.
      test_results: dict mapping a benchmark name to its runs.

    Returns:
      A list of ColumnChart objects. A result row is skipped when the average
      cell of any label holds a `str` rather than a number.
    """
    charts = []
    for item, runs in test_results.items():
        # Fun fact: label_names is actually *entirely* useless as a param,
        # since we never add headers. We still need to pass it anyway.
        table = TableGenerator(runs, label_names).GetTable()
        columns = [
            Column(AmeanResult(), Format()),
            Column(MinResult(), Format()),
            Column(MaxResult(), Format()),
        ]
        tf = TableFormatter(table, columns)
        data_table = tf.GetCellTable('full', headers=False)

        for cur_row_data in data_table:
            test_key = cur_row_data[0].string_value
            title = '{0}: {1}'.format(item, test_key.replace('/', ''))
            chart = ColumnChart(title, 300, 200)
            chart.AddColumn('Label', 'string')
            chart.AddColumn('Average', 'number')
            chart.AddColumn('Min', 'number')
            chart.AddColumn('Max', 'number')
            chart.AddSeries('Min', 'line', 'black')
            chart.AddSeries('Max', 'line', 'black')
            # Cell 0 is the key; after it, every label owns three consecutive
            # cells (average, min, max), matching `columns` above.
            cur_index = 1
            for label in label_names:
                chart.AddRow([
                    label,
                    cur_row_data[cur_index].value,
                    cur_row_data[cur_index + 1].value,
                    cur_row_data[cur_index + 2].value,
                ])
                if isinstance(cur_row_data[cur_index].value, str):
                    # Non-numeric data cannot be charted; drop the chart.
                    chart = None
                    break
                cur_index += 3
            if chart:
                charts.append(chart)
    return charts


class HTMLResultsReport(ResultsReport):
    """Class to generate html result report."""

    def __init__(self, benchmark_results, experiment=None):
        super(HTMLResultsReport, self).__init__(benchmark_results)
        self.experiment = experiment

    @staticmethod
    def FromExperiment(experiment):
        """Builds an HTMLResultsReport from an experiment's results."""
        return HTMLResultsReport(
            BenchmarkResults.FromExperiment(experiment), experiment=experiment)

    def GetReport(self):
        """Generates the HTML page for this report and returns it."""
        label_names = self.benchmark_results.label_names
        test_results = self.benchmark_results.run_keyvals
        charts = _GetHTMLCharts(label_names, test_results)
        chart_javascript = ''.join(chart.GetJavascript() for chart in charts)
        chart_divs = ''.join(chart.GetDiv() for chart in charts)

        summary_table = self.GetSummaryTables()
        full_table = self.GetFullTables()
        perf_table = self.GetSummaryTables(perf=True)
        experiment_file = ''
        if self.experiment is not None:
            experiment_file = self.experiment.experiment_file
        # Use kwargs for sanity, and so that testing is a bit easier.
        return templates.GenerateHTMLPage(
            perf_table=perf_table,
            chart_js=chart_javascript,
            summary_table=summary_table,
            print_table=_PrintTable,
            chart_divs=chart_divs,
            full_table=full_table,
            experiment_file=experiment_file)


def ParseStandardPerfReport(report_data):
    """Parses the output of `perf report`.

    It'll parse the following:
    {{garbage}}
    # Samples: 1234M of event 'foo'

    1.23% 4235 command shared_object [.] function::name

    1.22% 4210 command shared_object [.] function2::name

    # Samples: 999K of event 'bar'

    0.23% 12 command shared_object [.] function3::name
    {{etc.}}

    Into:
      {'foo': {'function::name': 1.23, 'function2::name': 1.22},
       'bar': {'function3::name': 0.23, etc.}}

    Args:
      report_data: either the whole report as a single string, or an iterable
        of lines (e.g. an open file).

    Returns:
      A dict of {event_name: {function_name: percentage}}; {} if no 'Samples'
      header is found. Lines that match neither pattern are ignored.
    """
    # This function fails silently on its if it's handed a string (as opposed
    # to a list of lines). So, auto-split if we do happen to get a string.
    if isinstance(report_data, _STRING_TYPES):
        report_data = report_data.splitlines()

    # Samples: N{K,M,G} of event 'event-name'
    samples_regex = re.compile(r"#\s+Samples: \d+\S? of event '([^']+)'")

    # We expect lines like:
    # N.NN%  samples  command  shared_object  [location]  symbol
    #
    # Note that we're looking at stripped lines, so there is no space at the
    # start.
    perf_regex = re.compile(r'^(\d+(?:\.\d*)?)%'  # N.NN%
                            r'\s*\d+'  # samples count (ignored)
                            r'\s*\S+'  # command (ignored)
                            r'\s*\S+'  # shared_object (ignored)
                            r'\s*\[.\]'  # location (ignored)
                            r'\s*(\S.+)'  # function
                           )

    stripped_lines = (l.strip() for l in report_data)
    nonempty_lines = (l for l in stripped_lines if l)
    # Ignore all lines before we see samples_regex
    interesting_lines = itertools.dropwhile(
        lambda x: not samples_regex.match(x), nonempty_lines)

    first_sample_line = next(interesting_lines, None)
    # Went through the entire file without finding a 'samples' header. Quit.
    if first_sample_line is None:
        return {}

    sample_name = samples_regex.match(first_sample_line).group(1)
    current_result = {}
    results = {sample_name: current_result}
    for line in interesting_lines:
        samples_match = samples_regex.match(line)
        if samples_match:
            # A new 'Samples' header starts the next event's section.
            sample_name = samples_match.group(1)
            current_result = {}
            results[sample_name] = current_result
            continue

        match = perf_regex.match(line)
        if not match:
            continue
        percentage_str, func_name = match.groups()
        try:
            percentage = float(percentage_str)
        except ValueError:
            # Couldn't parse it; try to be "resilient".
            continue
        current_result[func_name] = percentage
    return results


def _ReadExperimentPerfReport(results_directory, label_name, benchmark_name,
                              benchmark_iteration):
    """Reads a perf report for the given benchmark. Returns {} on failure.

    The report is read from
    <results_directory>/<dir_name>/perf.data.report.0, where <dir_name> is the
    label name, benchmark name and one-based iteration number joined together
    with every non-alphanumeric character removed.

    The result should be a map of maps; it should look like:
    {perf_event_name: {function_name: pct_time_spent}}, e.g.
    {'cpu_cycles': {'_malloc': 10.0, '_free': 0.3, ...}}
    """
    raw_dir_name = label_name + benchmark_name + str(benchmark_iteration + 1)
    dir_name = ''.join(c for c in raw_dir_name if c.isalnum())
    file_name = os.path.join(results_directory, dir_name, 'perf.data.report.0')
    try:
        with open(file_name) as in_file:
            return ParseStandardPerfReport(in_file)
    except IOError:
        # Yes, we swallow any IO-related errors.
        return {}


# Split out so that testing (specifically: mocking) is easier
def _ExperimentToKeyvals(experiment, for_json_report):
    """Converts an experiment to keyvals."""
    return OrganizeResults(
        experiment.benchmark_runs,
        experiment.labels,
        json_report=for_json_report)


class BenchmarkResults(object):
    """The minimum set of fields that any ResultsReport will take."""

    def __init__(self,
                 label_names,
                 benchmark_names_and_iterations,
                 run_keyvals,
                 read_perf_report=None):
        """Constructor.

        Args:
          label_names: list of label names.
          benchmark_names_and_iterations: list of (benchmark_name, iterations)
            pairs; also exposed as the dict `iter_counts`.
          run_keyvals: dict mapping each benchmark name to its results.
          read_perf_report: callable taking (label_name, benchmark_name,
            iteration) and returning a perf report dict. When None, a stub
            that always returns {} is used.
        """
        if read_perf_report is None:

            def _NoPerfReport(*_args, **_kwargs):
                return {}

            read_perf_report = _NoPerfReport

        self.label_names = label_names
        self.benchmark_names_and_iterations = benchmark_names_and_iterations
        self.iter_counts = dict(benchmark_names_and_iterations)
        self.run_keyvals = run_keyvals
        self.read_perf_report = read_perf_report

    @staticmethod
    def FromExperiment(experiment, for_json_report=False):
        """Collects the labels, benchmarks and keyvals of an experiment."""
        label_names = [label.name for label in experiment.labels]
        benchmark_names_and_iterations = [(benchmark.name,
                                           benchmark.iterations)
                                          for benchmark in
                                          experiment.benchmarks]
        run_keyvals = _ExperimentToKeyvals(experiment, for_json_report)
        read_perf_report = functools.partial(_ReadExperimentPerfReport,
                                             experiment.results_directory)
        return BenchmarkResults(label_names, benchmark_names_and_iterations,
                                run_keyvals, read_perf_report)


def _GetElemByName(name, from_list):
    """Gets an element from the given list by its name field.

    Raises an error if it doesn't find exactly one match.
    """
    elems = [e for e in from_list if e.name == name]
    if len(elems) != 1:
        raise ValueError('Expected 1 item named %s, found %d' % (name,
                                                                 len(elems)))
    return elems[0]


def _Unlist(l):
    """If l is a list, extracts the first element of l. Otherwise, returns l."""
    return l[0] if isinstance(l, list) else l


class JSONResultsReport(ResultsReport):
    """Class that generates JSON reports for experiments."""

    def __init__(self,
                 benchmark_results,
                 date=None,
                 time=None,
                 experiment=None,
                 json_args=None):
        """Construct a JSONResultsReport.

        json_args is the dict of arguments we pass to json.dumps in GetReport().

        If `date` is empty or None, both the date and the time are taken from
        the current local time, and any `time` that was passed in is ignored.
        """
        super(JSONResultsReport, self).__init__(benchmark_results)

        defaults = TelemetryDefaults()
        defaults.ReadDefaultsFile()
        summary_field_defaults = defaults.GetDefault()
        if summary_field_defaults is None:
            summary_field_defaults = {}
        self.summary_field_defaults = summary_field_defaults

        if json_args is None:
            json_args = {}
        self.json_args = json_args

        self.experiment = experiment
        if not date:
            timestamp = datetime.datetime.strftime(datetime.datetime.now(),
                                                   '%Y-%m-%d %H:%M:%S')
            date, time = timestamp.split(' ')
        self.date = date
        self.time = time

    @staticmethod
    def FromExperiment(experiment, date=None, time=None, json_args=None):
        """Builds a JSONResultsReport from an experiment's results."""
        benchmark_results = BenchmarkResults.FromExperiment(
            experiment, for_json_report=True)
        return JSONResultsReport(benchmark_results, date, time, experiment,
                                 json_args)

    def GetReportObjectIgnoringExperiment(self):
        """Gets the JSON report object specifically for the output data.

        Ignores any experiment-specific fields (e.g. board, machine checksum,
        ...).

        Returns:
          A list with one dict per (test, label, iteration). Iterations whose
          'retval' is not 0 only carry the date/time/label/test_name/pass
          fields.
        """
        benchmark_results = self.benchmark_results
        label_names = benchmark_results.label_names
        summary_field_defaults = self.summary_field_defaults
        final_results = []
        for test, test_results in benchmark_results.run_keyvals.items():
            for label_name, label_results in zip(label_names, test_results):
                for iter_results in label_results:
                    passed = iter_results.get('retval') == 0
                    json_results = {
                        'date': self.date,
                        'time': self.time,
                        'label': label_name,
                        'test_name': test,
                        'pass': passed,
                    }
                    final_results.append(json_results)

                    if not passed:
                        continue

                    # Get overall results.
                    summary_fields = summary_field_defaults.get(test)
                    if summary_fields is not None:
                        value = []
                        json_results['overall_result'] = value
                        for f in summary_fields:
                            v = iter_results.get(f)
                            if v is None:
                                continue
                            # New telemetry results format: sometimes we get a
                            # list of lists now.
                            v = _Unlist(_Unlist(v))
                            value.append((f, float(v)))

                    # Get detailed results.
                    detail_results = {}
                    json_results['detailed_results'] = detail_results
                    for k, v in iter_results.items():
                        if (k == 'retval' or k == 'PASS' or k == ['PASS'] or
                                v == 'PASS'):
                            continue

                        v = _Unlist(v)
                        if 'machine' in k:
                            # Machine fields go on the top-level object rather
                            # than into the detailed results.
                            json_results[k] = v
                        elif v is not None:
                            if isinstance(v, list):
                                detail_results[k] = [float(d) for d in v]
                            else:
                                detail_results[k] = float(v)
        return final_results

    def GetReportObject(self):
        """Generate the JSON report, returning it as a python object."""
        report_list = self.GetReportObjectIgnoringExperiment()
        if self.experiment is not None:
            self._AddExperimentSpecificFields(report_list)
        return report_list

    def _AddExperimentSpecificFields(self, report_list):
        """Add experiment-specific data to the JSON report."""
        # The board is taken from the first label and used for every report.
        board = self.experiment.labels[0].board
        manager = self.experiment.machine_manager
        for report in report_list:
            label_name = report['label']
            label = _GetElemByName(label_name, self.experiment.labels)

            img_path = os.path.realpath(
                os.path.expanduser(label.chromeos_image))
            ver, img = ParseChromeosImage(img_path)

            report.update({
                'board': board,
                'chromeos_image': img,
                'chromeos_version': ver,
                'chrome_version': label.chrome_version,
                'compiler': label.compiler
            })

            if not report['pass']:
                continue
            # Machine fields that came from the results themselves win over
            # the machine manager's values.
            if 'machine_checksum' not in report:
                report['machine_checksum'] = (
                    manager.machine_checksum[label_name])
            if 'machine_string' not in report:
                report['machine_string'] = (
                    manager.machine_checksum_string[label_name])

    def GetReport(self):
        """Dump the results of self.GetReportObject() to a string as JSON."""
        # This exists for consistency with the other GetReport methods.
        # Specifically, they all return strings, so it's a bit awkward if the
        # JSON results reporter returns an object.
        return json.dumps(self.GetReportObject(), **self.json_args)