| Brad Bishop | 6e60e8b | 2018-02-01 10:27:11 -0500 | [diff] [blame] | 1 | #!/usr/bin/python3 | 
|  | 2 | # | 
|  | 3 | # Examine build performance test results | 
|  | 4 | # | 
|  | 5 | # Copyright (c) 2017, Intel Corporation. | 
|  | 6 | # | 
| Brad Bishop | c342db3 | 2019-05-15 21:57:59 -0400 | [diff] [blame] | 7 | # SPDX-License-Identifier: GPL-2.0-only | 
| Brad Bishop | 6e60e8b | 2018-02-01 10:27:11 -0500 | [diff] [blame] | 8 | # | 
| Brad Bishop | c342db3 | 2019-05-15 21:57:59 -0400 | [diff] [blame] | 9 |  | 
| Brad Bishop | 6e60e8b | 2018-02-01 10:27:11 -0500 | [diff] [blame] | 10 | import argparse | 
|  | 11 | import json | 
|  | 12 | import logging | 
|  | 13 | import os | 
|  | 14 | import re | 
|  | 15 | import sys | 
|  | 16 | from collections import namedtuple, OrderedDict | 
|  | 17 | from operator import attrgetter | 
|  | 18 | from xml.etree import ElementTree as ET | 
|  | 19 |  | 
|  | 20 | # Import oe libs | 
|  | 21 | scripts_path = os.path.dirname(os.path.realpath(__file__)) | 
|  | 22 | sys.path.append(os.path.join(scripts_path, 'lib')) | 
|  | 23 | import scriptpath | 
|  | 24 | from build_perf import print_table | 
|  | 25 | from build_perf.report import (metadata_xml_to_json, results_xml_to_json, | 
| Brad Bishop | d7bf8c1 | 2018-02-25 22:55:05 -0500 | [diff] [blame] | 26 | aggregate_data, aggregate_metadata, measurement_stats, | 
|  | 27 | AggregateTestData) | 
| Brad Bishop | 6e60e8b | 2018-02-01 10:27:11 -0500 | [diff] [blame] | 28 | from build_perf import html | 
| Brad Bishop | d7bf8c1 | 2018-02-25 22:55:05 -0500 | [diff] [blame] | 29 | from buildstats import BuildStats, diff_buildstats, BSVerDiff | 
| Brad Bishop | 6e60e8b | 2018-02-01 10:27:11 -0500 | [diff] [blame] | 30 |  | 
|  | 31 | scriptpath.add_oe_lib_path() | 
|  | 32 |  | 
| Brad Bishop | d7bf8c1 | 2018-02-25 22:55:05 -0500 | [diff] [blame] | 33 | from oeqa.utils.git import GitRepo, GitError | 
| Andrew Geissler | 99467da | 2019-02-25 18:54:23 -0600 | [diff] [blame] | 34 | import oeqa.utils.gitarchive as gitarchive | 
| Brad Bishop | 6e60e8b | 2018-02-01 10:27:11 -0500 | [diff] [blame] | 35 |  | 
|  | 36 |  | 
# Setup logging: messages are printed as "<LEVEL>: <message>" at INFO level
# by default; 'log' is the logger used by every function in this script.
log = logging.getLogger('oe-build-perf-report')
logging.basicConfig(format="%(levelname)s: %(message)s", level=logging.INFO)
|  | 40 |  | 
def list_test_revs(repo, tag_name, verbosity, **kwargs):
    """Print a table of all tested revisions.

    Consecutive test runs whose printed fields are all identical are
    collapsed into one row that carries a test run counter (and, when
    verbosity is below 2, a commit counter).

    Args:
        repo: Repository object handed to gitarchive.get_test_runs().
        tag_name: Tag name pattern used for finding the test runs.
        verbosity: Level of detail. Below 2 the 'commit_number' and 'commit'
            columns are hidden and a 'COMMITS' counter column is added.
        **kwargs: Extra keyword arguments forwarded to
            gitarchive.get_test_runs(); entries whose value is None are
            dropped first.
    """
    valid_kwargs = {k: v for k, v in kwargs.items() if v is not None}

    fields, revs = gitarchive.get_test_runs(log, repo, tag_name, **valid_kwargs)
    ignore_fields = ['tag_number']
    if verbosity < 2:
        extra_fields = ['COMMITS', 'TEST RUNS']
        ignore_fields.extend(['commit_number', 'commit'])
    else:
        extra_fields = ['TEST RUNS']

    # Indices (into 'fields' and into each rev) of the columns to print
    print_fields = [i for i, f in enumerate(fields) if f not in ignore_fields]
    num_print = len(print_fields)

    # Header row
    rows = [[fields[i].upper() for i in print_fields] + extra_fields]

    prev = [''] * num_print
    prev_commit = None
    commit_cnt = 0
    commit_field = fields.index('commit')
    for rev in revs:
        # Only use fields that we want to print
        cols = [rev[i] for i in print_fields]

        if cols != prev:
            commit_cnt = 1
            test_run_cnt = 1
            new_row = [''] * (num_print + len(extra_fields))

            # Find the first column that differs from the previous row so
            # that repeated leading values are left blank. 'cols' and 'prev'
            # are positional lists, so they must be indexed by position and
            # not by the field indices stored in 'print_fields'.
            for first_diff in range(num_print):
                if cols[first_diff] != prev[first_diff]:
                    break
            new_row[first_diff:-len(extra_fields)] = cols[first_diff:]
            rows.append(new_row)
        else:
            if rev[commit_field] != prev_commit:
                commit_cnt += 1
            test_run_cnt += 1

        # 'new_row' is already in 'rows', so the counters of the current
        # group are updated in place
        if verbosity < 2:
            new_row[-2] = commit_cnt
        new_row[-1] = test_run_cnt
        prev = cols
        prev_commit = rev[commit_field]

    print_table(rows)
|  | 89 |  | 
def is_xml_format(repo, commit):
    """Tell whether the results stored in a commit are in xml format.

    Returns True when 'results.xml' can be resolved in the given commit,
    otherwise False (the results are then assumed to be json formatted).
    """
    found_xml = bool(repo.rev_parse(commit + ':results.xml'))
    if found_xml:
        log.debug("Detected report in xml format in %s", commit)
    else:
        log.debug("No xml report in %s, assuming json formatted results", commit)
    return found_xml
|  | 98 |  | 
def read_results(repo, tags, xml=True):
    """Load the metadata and result files of the given tags from the repo.

    Args:
        repo: Repository object providing run_cmd().
        tags: List of tag names whose files are read.
        xml: Read 'metadata.xml'/'results.xml' when true, otherwise
            'metadata.json'/'results.json'.

    Returns:
        A 2-tuple (list of metadata, list of results), both converted to
        the json representation.
    """

    def parse_xml_stream(data):
        """Split concatenated XML documents and parse each of them"""
        parsed = []
        pending = ""
        for line in data.splitlines():
            # An XML declaration after some content starts the next document
            starts_next = bool(pending) and line.startswith('<?xml version=')
            if starts_next:
                parsed.append(ET.fromstring(pending))
                pending = line
            else:
                pending += line
        parsed.append(ET.fromstring(pending))
        return parsed

    def parse_json_stream(data):
        """Split concatenated JSON objects and parse each of them"""
        def decode(text):
            return json.loads(text, object_pairs_hook=OrderedDict)

        parsed = []
        pending = ""
        for line in data.splitlines():
            if line != '}{':
                pending += line
                continue
            # A '}{' line closes one object and opens the next one
            parsed.append(decode(pending + '}'))
            pending = '{'
        parsed.append(decode(pending))
        return parsed

    num_revs = len(tags)

    # Optimize by reading all data with one git command
    log.debug("Loading raw result data from %d tags, %s...", num_revs, tags[0])
    if xml:
        metadata_objs = [tag + ':metadata.xml' for tag in tags]
        results_objs = [tag + ':results.xml' for tag in tags]
        raw = repo.run_cmd(['show'] + (metadata_objs + results_objs) + ['--'])
        docs = parse_xml_stream(raw)
        # The first num_revs documents are metadata, the rest are results
        return ([metadata_xml_to_json(doc) for doc in docs[:num_revs]],
                [results_xml_to_json(doc) for doc in docs[num_revs:]])

    metadata_objs = [tag + ':metadata.json' for tag in tags]
    results_objs = [tag + ':results.json' for tag in tags]
    raw = repo.run_cmd(['show'] + (metadata_objs + results_objs) + ['--'])
    docs = parse_json_stream(raw)
    return docs[:num_revs], docs[num_revs:]
|  | 142 |  | 
|  | 143 |  | 
def get_data_item(data, key):
    """Look up a value in nested containers with a dot-separated key.

    Each '.'-separated component of 'key' is used as a subscript on the
    value found so far, e.g. 'a.b' returns data['a']['b'].
    """
    node = data
    for part in key.split('.'):
        node = node[part]
    return node
|  | 149 |  | 
|  | 150 |  | 
def metadata_diff(metadata_l, metadata_r):
    """Collect the metadata of two test reports side by side for printing.

    Returns an OrderedDict keyed by a short item name. Each value is a dict
    with the display 'title', the 'value_old' taken from metadata_l and the
    'value' taken from metadata_r. Items missing from a report are shown as
    '(N/A)'.
    """
    def lookup(metadata, path):
        """Get one metadata item, or a placeholder if it is not available"""
        try:
            return get_data_item(metadata, path)
        except KeyError:
            return '(N/A)'

    # (display title, key in the returned dict, dotted path in the metadata)
    items = (
        ('Hostname', 'hostname', 'hostname'),
        ('Branch', 'branch', 'layers.meta.branch'),
        ('Commit number', 'commit_num', 'layers.meta.commit_count'),
        ('Commit', 'commit', 'layers.meta.commit'),
        ('Number of test runs', 'testrun_count', 'testrun_count'),
    )

    diff = OrderedDict()
    for title, name, path in items:
        old_value = lookup(metadata_l, path)
        new_value = lookup(metadata_r, path)
        diff[name] = {'title': title,
                      'value_old': old_value,
                      'value': new_value}
    return diff
|  | 179 |  | 
|  | 180 |  | 
def print_diff_report(metadata_l, data_l, metadata_r, data_r):
    """Print a plain text comparison of two sets of test results.

    The 'right' data set (metadata_r, data_r) is shown as the current commit
    and the 'left' one (metadata_l, data_l) as the one it is compared with.
    Tests and measurements present only on the right are marked with '+',
    those present only on the left with '-'.
    """
    # First, print general metadata
    print("\nTEST METADATA:\n==============")
    meta_rows = [['', 'CURRENT COMMIT', 'COMPARING WITH']]
    for key, val in metadata_diff(metadata_l, metadata_r).items():
        current = val['value']
        compared = val['value_old']
        if key == 'commit':
            # Shorten commit hashes
            current = current[:20]
            compared = compared[:20]
        meta_rows.append([val['title'] + ':', current, compared])
    print_table(meta_rows, ['{:{wid}} ', '{:<{wid}}   ', '{:<{wid}}'])

    # Print test results
    print("\nTEST RESULTS:\n=============")

    tests_l = data_l['tests']
    tests_r = data_r['tests']
    # Tests of the 'left' set first, followed by those only in the 'right' set
    test_names = list(tests_l.keys())
    test_names = test_names + [t for t in tests_r.keys() if t not in test_names]

    # Prepare data to be printed
    row_fmt = ['{:8}', '{:{wid}}', '{:{wid}}', '  {:>{wid}}', ' {:{wid}} ', '{:{wid}}',
               '  {:>{wid}}', '  {:>{wid}}']
    num_cols = len(row_fmt)
    rows = []
    for test in test_names:
        test_l = None if test not in tests_l else tests_l[test]
        test_r = None if test not in tests_r else tests_r[test]
        if test_l is None:
            pref = '+'
        elif test_r is None:
            pref = '-'
        else:
            pref = ' '
        descr = (test_l or test_r)['description']
        rows.append(["{} {}: {}".format(pref, test, descr)])

        # Generate the list of measurements
        meas_l = test_l['measurements'] if test_l else {}
        meas_r = test_r['measurements'] if test_r else {}
        meas_names = list(meas_l.keys())
        meas_names = meas_names + [m for m in meas_r.keys() if m not in meas_names]

        for meas in meas_names:
            in_left = meas in meas_l
            in_right = meas in meas_r
            stats_l = measurement_stats(meas_l[meas] if in_left else None, 'l.')
            stats_r = measurement_stats(meas_r[meas] if in_right else None, 'r.')
            if not in_right:
                m_pref = '-'
            elif not in_left:
                m_pref = '+'
            else:
                m_pref = ' '
            stats = stats_l.copy()
            stats.update(stats_r)

            mean_l = stats['l.mean']
            mean_r = stats['r.mean']
            absdiff = stats['val_cls'](mean_r - mean_l)
            reldiff = "{:+.1f} %".format(absdiff * 100 / mean_l)
            # Positive differences get an explicit sign
            sign = '+' if mean_r > mean_l else ''
            rows.append(['', m_pref, stats['name'] + ' ' + stats['quantity'],
                         str(mean_l), '->', str(mean_r),
                         sign + str(absdiff), reldiff])
        # Empty row separating the tests
        rows.append([''] * num_cols)

    print_table(rows, row_fmt)

    print()
|  | 259 |  | 
|  | 260 |  | 
class BSSummary(object):
    """Summary of the differences between two sets of buildstats.

    bs1 is the older/compared set and bs2 the newer one: the task count is
    taken from bs2 and the change is calculated as bs2 minus bs1.
    """

    def __init__(self, bs1, bs2):
        # Number of tasks in bs2 and the signed change compared to bs1
        task_change = bs2.num_tasks - bs1.num_tasks
        self.tasks = {'count': bs2.num_tasks,
                      'change': '{:+d}'.format(task_change)}
        self.top_consumer = None
        self.top_decrease = None
        self.top_increase = None
        # Recipe version changes, category title -> list of (name, text)
        self.ver_diff = OrderedDict()

        # Get top consumers of resources (five largest 'value2')
        by_value = sorted(diff_buildstats(bs1, bs2, 'cputime'),
                          key=attrgetter('value2'))
        self.top_consumer = by_value[-5:]

        # Get biggest increase and decrease in resource usage. The list is
        # re-sorted from the 'value2' ordering, so equal 'absdiff' values
        # keep that relative order.
        by_change = sorted(by_value, key=attrgetter('absdiff'))
        self.top_decrease = by_change[0:5]
        self.top_increase = by_change[-5:]

        # Compare recipe versions and prepare data for display
        ver_diff = BSVerDiff(bs1, bs2)
        if ver_diff:
            def evr_change(rec):
                return "{} → {}".format(rec.left.evr, rec.right.evr)

            def version_change(rec):
                return "{} → {}".format(rec.left.version, rec.right.version)

            # (title, attribute of ver_diff, text shown for each recipe)
            categories = (
                ('New recipes', 'new', attrgetter('evr')),
                ('Dropped recipes', 'dropped', attrgetter('evr')),
                ('Epoch changed', 'echanged', evr_change),
                ('Version changed', 'vchanged', version_change),
                ('Revision changed', 'rchanged', evr_change),
            )
            for title, attr, describe in categories:
                recipes = getattr(ver_diff, attr)
                if recipes:
                    self.ver_diff[title] = [(name, describe(rec))
                                            for name, rec in recipes.items()]
|  | 294 |  | 
|  | 295 |  | 
|  | 296 | def print_html_report(data, id_comp, buildstats): | 
| Brad Bishop | 6e60e8b | 2018-02-01 10:27:11 -0500 | [diff] [blame] | 297 | """Print report in html format""" | 
|  | 298 | # Handle metadata | 
| Brad Bishop | d7bf8c1 | 2018-02-25 22:55:05 -0500 | [diff] [blame] | 299 | metadata = metadata_diff(data[id_comp].metadata, data[-1].metadata) | 
| Brad Bishop | 6e60e8b | 2018-02-01 10:27:11 -0500 | [diff] [blame] | 300 |  | 
|  | 301 | # Generate list of tests | 
|  | 302 | tests = [] | 
| Brad Bishop | d7bf8c1 | 2018-02-25 22:55:05 -0500 | [diff] [blame] | 303 | for test in data[-1].results['tests'].keys(): | 
|  | 304 | test_r = data[-1].results['tests'][test] | 
| Brad Bishop | 6e60e8b | 2018-02-01 10:27:11 -0500 | [diff] [blame] | 305 | new_test = {'name': test_r['name'], | 
|  | 306 | 'description': test_r['description'], | 
|  | 307 | 'status': test_r['status'], | 
|  | 308 | 'measurements': [], | 
|  | 309 | 'err_type': test_r.get('err_type'), | 
|  | 310 | } | 
|  | 311 | # Limit length of err output shown | 
|  | 312 | if 'message' in test_r: | 
|  | 313 | lines = test_r['message'].splitlines() | 
|  | 314 | if len(lines) > 20: | 
|  | 315 | new_test['message'] = '...\n' + '\n'.join(lines[-20:]) | 
|  | 316 | else: | 
|  | 317 | new_test['message'] = test_r['message'] | 
|  | 318 |  | 
|  | 319 |  | 
|  | 320 | # Generate the list of measurements | 
|  | 321 | for meas in test_r['measurements'].keys(): | 
|  | 322 | meas_r = test_r['measurements'][meas] | 
|  | 323 | meas_type = 'time' if meas_r['type'] == 'sysres' else 'size' | 
|  | 324 | new_meas = {'name': meas_r['name'], | 
|  | 325 | 'legend': meas_r['legend'], | 
|  | 326 | 'description': meas_r['name'] + ' ' + meas_type, | 
|  | 327 | } | 
|  | 328 | samples = [] | 
|  | 329 |  | 
|  | 330 | # Run through all revisions in our data | 
|  | 331 | for meta, test_data in data: | 
|  | 332 | if (not test in test_data['tests'] or | 
|  | 333 | not meas in test_data['tests'][test]['measurements']): | 
|  | 334 | samples.append(measurement_stats(None)) | 
|  | 335 | continue | 
|  | 336 | test_i = test_data['tests'][test] | 
|  | 337 | meas_i = test_i['measurements'][meas] | 
|  | 338 | commit_num = get_data_item(meta, 'layers.meta.commit_count') | 
|  | 339 | samples.append(measurement_stats(meas_i)) | 
|  | 340 | samples[-1]['commit_num'] = commit_num | 
|  | 341 |  | 
|  | 342 | absdiff = samples[-1]['val_cls'](samples[-1]['mean'] - samples[id_comp]['mean']) | 
| Brad Bishop | 1a4b7ee | 2018-12-16 17:11:34 -0800 | [diff] [blame] | 343 | reldiff = absdiff * 100 / samples[id_comp]['mean'] | 
| Brad Bishop | 6e60e8b | 2018-02-01 10:27:11 -0500 | [diff] [blame] | 344 | new_meas['absdiff'] = absdiff | 
|  | 345 | new_meas['absdiff_str'] = str(absdiff) if absdiff < 0 else '+' + str(absdiff) | 
| Brad Bishop | 1a4b7ee | 2018-12-16 17:11:34 -0800 | [diff] [blame] | 346 | new_meas['reldiff'] = reldiff | 
|  | 347 | new_meas['reldiff_str'] = "{:+.1f} %".format(reldiff) | 
| Brad Bishop | 6e60e8b | 2018-02-01 10:27:11 -0500 | [diff] [blame] | 348 | new_meas['samples'] = samples | 
|  | 349 | new_meas['value'] = samples[-1] | 
|  | 350 | new_meas['value_type'] = samples[-1]['val_cls'] | 
|  | 351 |  | 
| Brad Bishop | d7bf8c1 | 2018-02-25 22:55:05 -0500 | [diff] [blame] | 352 | # Compare buildstats | 
|  | 353 | bs_key = test + '.' + meas | 
| Andrew Geissler | 99467da | 2019-02-25 18:54:23 -0600 | [diff] [blame] | 354 | rev = str(metadata['commit_num']['value']) | 
|  | 355 | comp_rev = str(metadata['commit_num']['value_old']) | 
| Brad Bishop | d7bf8c1 | 2018-02-25 22:55:05 -0500 | [diff] [blame] | 356 | if (rev in buildstats and bs_key in buildstats[rev] and | 
|  | 357 | comp_rev in buildstats and bs_key in buildstats[comp_rev]): | 
|  | 358 | new_meas['buildstats'] = BSSummary(buildstats[comp_rev][bs_key], | 
|  | 359 | buildstats[rev][bs_key]) | 
|  | 360 |  | 
|  | 361 |  | 
| Brad Bishop | 6e60e8b | 2018-02-01 10:27:11 -0500 | [diff] [blame] | 362 | new_test['measurements'].append(new_meas) | 
|  | 363 | tests.append(new_test) | 
|  | 364 |  | 
|  | 365 | # Chart options | 
|  | 366 | chart_opts = {'haxis': {'min': get_data_item(data[0][0], 'layers.meta.commit_count'), | 
|  | 367 | 'max': get_data_item(data[-1][0], 'layers.meta.commit_count')} | 
|  | 368 | } | 
|  | 369 |  | 
| Brad Bishop | d7bf8c1 | 2018-02-25 22:55:05 -0500 | [diff] [blame] | 370 | print(html.template.render(title="Build Perf Test Report", | 
|  | 371 | metadata=metadata, test_data=tests, | 
|  | 372 | chart_opts=chart_opts)) | 
|  | 373 |  | 
|  | 374 |  | 
def get_buildstats(repo, notes_ref, revs, outdir=None):
    """Get the buildstats from git notes.

    Args:
        repo: Repository object providing rev_parse() and run_cmd().
        notes_ref: Name of the notes ref, without the 'refs/notes/' prefix.
        revs: Revisions to read; each provides 'commit_number', 'commit'
            and 'tags'.
        outdir: If set, every buildstats object is also written to
            '<outdir>/<measurement>/<tag base>/<run id>.json'.

    Returns:
        A dict mapping each commit number to a dict of measurement name to
        the buildstats aggregated over all tags of that revision, or None if
        the notes ref does not exist.
    """
    full_ref = 'refs/notes/' + notes_ref
    if not repo.rev_parse(full_ref):
        log.error("No buildstats found, please try running "
                  "'git fetch origin %s:%s' to fetch them from the remote",
                  full_ref, full_ref)
        return None

    missing = False
    buildstats = {}
    log.info("Parsing buildstats from 'refs/notes/%s'", notes_ref)
    for rev in revs:
        rev_stats = buildstats[rev.commit_number] = {}
        log.debug('Dumping buildstats for %s (%s)', rev.commit_number,
                  rev.commit)
        for tag in rev.tags:
            log.debug('    %s', tag)
            try:
                bs_all = json.loads(repo.run_cmd(['notes', '--ref', notes_ref,
                                                  'show', tag + '^0']))
            except GitError:
                # Best effort: report the gap once at the end and carry on
                log.warning("Buildstats not found for %s", tag)
                bs_all = {}
                missing = True

            if outdir and bs_all:
                # The last tag component identifies the test run, the rest
                # is flattened into a single directory name
                tag_base, run_id = tag.rsplit('/', 1)
                tag_base = tag_base.replace('/', '_')

            for measurement, bs in bs_all.items():
                # Write out onto disk
                if outdir:
                    bs_dir = os.path.join(outdir, measurement, tag_base)
                    # exist_ok avoids the check-then-create race
                    os.makedirs(bs_dir, exist_ok=True)
                    with open(os.path.join(bs_dir, run_id + '.json'), 'w') as f:
                        json.dump(bs, f, indent=2)

                # Read buildstats into a dict
                _bs = BuildStats.from_json(bs)
                if measurement not in rev_stats:
                    rev_stats[measurement] = _bs
                else:
                    rev_stats[measurement].aggregate(_bs)

    if missing:
        log.info("Buildstats were missing for some test runs, please "
                 "run 'git fetch origin %s:%s' and try again",
                 full_ref, full_ref)

    return buildstats
| Brad Bishop | 6e60e8b | 2018-02-01 10:27:11 -0500 | [diff] [blame] | 425 |  | 
|  | 426 |  | 
def auto_args(repo, args):
    """Fill in hostname and branch from the latest commit, if not set.

    The body of the most recent commit (over all branches and remotes) is
    scanned for 'key: value' lines. 'hostname' and 'branch' values are
    stored into 'args' unless the corresponding argument already has a
    value. 'args' is modified in place.
    """
    # Get the latest commit in the repo
    log.debug("Guessing arguments from the latest commit")
    body = repo.run_cmd(['log', '-1', '--branches', '--remotes', '--format=%b'])
    for line in body.splitlines():
        key, colon, rest = line.partition(':')
        if not colon:
            # Not a 'key: value' line
            continue

        val = rest.strip()
        if key == 'hostname':
            if not args.hostname:
                log.debug("Using hostname %s", val)
                args.hostname = val
        elif key == 'branch':
            if not args.branch:
                log.debug("Using branch %s", val)
                args.branch = val
|  | 445 |  | 
|  | 446 |  | 
def parse_args(argv):
    """Parse command line arguments.

    Args:
        argv: List of argument strings, passed as is to argparse.

    Returns:
        The argparse namespace holding the parsed options.
    """
    description = """
Examine build performance test results from a Git repository"""
    parser = argparse.ArgumentParser(
        description=description,
        formatter_class=argparse.ArgumentDefaultsHelpFormatter)

    # General options
    parser.add_argument('--debug', '-d', action='store_true',
                        help="Verbose logging")
    parser.add_argument('--repo', '-r', required=True,
                        help="Results repository (local git clone)")
    # Counted, so that repeating the option raises the listing verbosity
    parser.add_argument('--list', '-l', action='count',
                        help="List available test runs")
    parser.add_argument('--html', action='store_true',
                        help="Generate report in html format")

    # Options selecting the revisions to report on
    rev_group = parser.add_argument_group('Tag and revision')
    rev_group.add_argument(
        '--tag-name', '-t',
        default='{hostname}/{branch}/{machine}/{commit_number}-g{commit}/{tag_number}',
        help="Tag name (pattern) for finding results")
    rev_group.add_argument('--hostname', '-H')
    rev_group.add_argument('--branch', '-B', default='master',
                           help="Branch to find commit in")
    rev_group.add_argument('--branch2',
                           help="Branch to find comparision revisions in")
    rev_group.add_argument('--machine', default='qemux86')
    rev_group.add_argument(
        '--history-length', default=25, type=int,
        help="Number of tested revisions to plot in html report")
    rev_group.add_argument('--commit', help="Revision to search for")
    rev_group.add_argument(
        '--commit-number',
        help="Revision number to search for, redundant if "
             "--commit is specified")
    rev_group.add_argument('--commit2', help="Revision to compare with")
    rev_group.add_argument(
        '--commit-number2',
        help="Revision number to compare with, redundant if "
             "--commit2 is specified")

    # Takes an optional value; '.' is stored when the option is given bare
    parser.add_argument('--dump-buildstats', nargs='?', const='.',
                        help="Dump buildstats of the tests")

    return parser.parse_args(argv)
|  | 487 |  | 
|  | 488 |  | 
def main(argv=None):
    """Script entry point.

    Lists the available test runs (--list) or prints a report comparing two
    tested revisions, either as plain text or as html.

    Returns:
        0 on success, 1 if the revisions to report on cannot be determined.
    """
    args = parse_args(argv)
    if args.debug:
        log.setLevel(logging.DEBUG)

    repo = GitRepo(args.repo)

    if args.list:
        list_test_revs(repo, args.tag_name, args.list, hostname=args.hostname)
        return 0

    # Determine hostname which to use
    if not args.hostname:
        auto_args(repo, args)

    revs = gitarchive.get_test_revs(log, repo, args.tag_name,
                                    hostname=args.hostname,
                                    branch=args.branch,
                                    machine=args.machine)
    if args.branch2:
        revs2 = gitarchive.get_test_revs(log, repo, args.tag_name,
                                         hostname=args.hostname,
                                         branch=args.branch2,
                                         machine=args.machine)
        if len(revs2) == 0:
            log.error("No revisions found to compare against")
            return 1
        if len(revs) == 0:
            log.error("No revision to report on found")
            return 1
    elif len(revs) < 2:
        # Without a second branch both revisions come from the same list
        log.error("Only %d tester revisions found, unable to generate report",
                  len(revs))
        return 1

    # Pick revisions
    if args.commit:
        if args.commit_number:
            log.warning("Ignoring --commit-number as --commit was specified")
        index1 = gitarchive.rev_find(revs, 'commit', args.commit)
    elif args.commit_number:
        index1 = gitarchive.rev_find(revs, 'commit_number', args.commit_number)
    else:
        # Default to the last revision of the list
        index1 = len(revs) - 1

    if args.branch2:
        # Continue with the revisions of the second branch, with the picked
        # revision appended as the last item
        revs2.append(revs[index1])
        index1 = len(revs2) - 1
        revs = revs2

    if args.commit2:
        if args.commit_number2:
            log.warning("Ignoring --commit-number2 as --commit2 was specified")
        index2 = gitarchive.rev_find(revs, 'commit', args.commit2)
    elif args.commit_number2:
        index2 = gitarchive.rev_find(revs, 'commit_number', args.commit_number2)
    else:
        if index1 <= 0:
            log.error("Unable to determine the other commit, use "
                      "--commit2 or --commit-number2 to specify it")
            return 1
        index2 = index1 - 1
        # Find the closest matching commit number for comparision
        # In future we could check the commit is a common ancestor and
        # continue back if not but this good enough for now
        # NOTE(review): commit numbers are compared as provided by
        # gitarchive; if they are strings this is a lexicographic
        # comparison - confirm.
        while index2 > 0 and revs[index2].commit_number > revs[index1].commit_number:
            index2 -= 1

    index_l, index_r = sorted((index1, index2))

    rev_l = revs[index_l]
    rev_r = revs[index_r]
    log.debug("Using 'left' revision %s (%s), %s test runs:\n    %s",
              rev_l.commit_number, rev_l.commit, len(rev_l.tags),
              '\n    '.join(rev_l.tags))
    log.debug("Using 'right' revision %s (%s), %s test runs:\n    %s",
              rev_r.commit_number, rev_r.commit, len(rev_r.tags),
              '\n    '.join(rev_r.tags))

    # Check report format used in the repo (assume all reports in the same fmt)
    xml = is_xml_format(repo, rev_r.tags[-1])

    if args.html:
        # Include history before the 'right' revision for the charts, but
        # never start after the 'left' revision
        index_0 = max(0, min(index_l, index_r - args.history_length))
        rev_range = range(index_0, index_r + 1)
    else:
        # We do not need range of commits for text report (no graphs)
        index_0 = index_l
        rev_range = (index_l, index_r)

    # Read raw data
    log.debug("Reading %d revisions, starting from %s (%s)",
              len(rev_range), revs[index_0].commit_number, revs[index_0].commit)
    raw_data = [read_results(repo, revs[i].tags, xml) for i in rev_range]

    data = [AggregateTestData(aggregate_metadata(raw_m), aggregate_data(raw_d))
            for raw_m, raw_d in raw_data]

    # Read buildstats only when needed
    buildstats = None
    if args.dump_buildstats or args.html:
        outdir = 'oe-build-perf-buildstats' if args.dump_buildstats else None
        notes_ref = 'buildstats/{}/{}/{}'.format(args.hostname, args.branch,
                                                 args.machine)
        buildstats = get_buildstats(repo, notes_ref, [rev_l, rev_r], outdir)

    # Print report
    if args.html:
        # Re-map 'left' list index to the data table where index_0 maps to 0
        print_html_report(data, index_l - index_0, buildstats)
    else:
        left, right = data[0], data[1]
        print_diff_report(left.metadata, left.results,
                          right.metadata, right.results)

    return 0
|  | 605 |  | 
# Run the report only when executed as a script; the value returned by
# main() becomes the process exit status.
if __name__ == "__main__":
    raise SystemExit(main())