| Brad Bishop | 6e60e8b | 2018-02-01 10:27:11 -0500 | [diff] [blame] | 1 | #!/usr/bin/python3 | 
|  | 2 | # | 
|  | 3 | # Examine build performance test results | 
|  | 4 | # | 
|  | 5 | # Copyright (c) 2017, Intel Corporation. | 
|  | 6 | # | 
|  | 7 | # This program is free software; you can redistribute it and/or modify it | 
|  | 8 | # under the terms and conditions of the GNU General Public License, | 
|  | 9 | # version 2, as published by the Free Software Foundation. | 
|  | 10 | # | 
|  | 11 | # This program is distributed in the hope it will be useful, but WITHOUT | 
|  | 12 | # ANY WARRANTY; without even the implied warranty of MERCHANTABILITY or | 
|  | 13 | # FITNESS FOR A PARTICULAR PURPOSE.  See the GNU General Public License for | 
|  | 14 | # more details. | 
|  | 15 | # | 
|  | 16 | import argparse | 
|  | 17 | import json | 
|  | 18 | import logging | 
|  | 19 | import os | 
|  | 20 | import re | 
|  | 21 | import sys | 
|  | 22 | from collections import namedtuple, OrderedDict | 
|  | 23 | from operator import attrgetter | 
|  | 24 | from xml.etree import ElementTree as ET | 
|  | 25 |  | 
|  | 26 | # Import oe libs | 
|  | 27 | scripts_path = os.path.dirname(os.path.realpath(__file__)) | 
|  | 28 | sys.path.append(os.path.join(scripts_path, 'lib')) | 
|  | 29 | import scriptpath | 
|  | 30 | from build_perf import print_table | 
|  | 31 | from build_perf.report import (metadata_xml_to_json, results_xml_to_json, | 
| Brad Bishop | d7bf8c1 | 2018-02-25 22:55:05 -0500 | [diff] [blame] | 32 | aggregate_data, aggregate_metadata, measurement_stats, | 
|  | 33 | AggregateTestData) | 
| Brad Bishop | 6e60e8b | 2018-02-01 10:27:11 -0500 | [diff] [blame] | 34 | from build_perf import html | 
| Brad Bishop | d7bf8c1 | 2018-02-25 22:55:05 -0500 | [diff] [blame] | 35 | from buildstats import BuildStats, diff_buildstats, BSVerDiff | 
| Brad Bishop | 6e60e8b | 2018-02-01 10:27:11 -0500 | [diff] [blame] | 36 |  | 
|  | 37 | scriptpath.add_oe_lib_path() | 
|  | 38 |  | 
| Brad Bishop | d7bf8c1 | 2018-02-25 22:55:05 -0500 | [diff] [blame] | 39 | from oeqa.utils.git import GitRepo, GitError | 
| Andrew Geissler | 99467da | 2019-02-25 18:54:23 -0600 | [diff] [blame] | 40 | import oeqa.utils.gitarchive as gitarchive | 
| Brad Bishop | 6e60e8b | 2018-02-01 10:27:11 -0500 | [diff] [blame] | 41 |  | 
|  | 42 |  | 
# Setup logging: the root logger is configured at INFO level with a
# "<LEVEL>: <message>" line format; main() raises this script's logger to
# DEBUG when --debug is given
logging.basicConfig(level=logging.INFO, format="%(levelname)s: %(message)s")
log = logging.getLogger('oe-build-perf-report')
|  | 46 |  | 
def list_test_revs(repo, tag_name, verbosity, **kwargs):
    """Print a table of all tested revisions

    Consecutive test runs whose printed fields are all equal share one table
    row; the row carries the number of test runs and, when verbosity is
    below 2, the number of distinct consecutive commits it stands for.
    Leading columns that repeat the previous row are left blank.

    Args:
        repo: repository object passed on to gitarchive.get_test_runs()
        tag_name: tag name pattern passed on to gitarchive.get_test_runs()
        verbosity: below 2 the 'commit_number' and 'commit' fields are
            hidden and a COMMITS count column is printed instead
        **kwargs: extra keyword arguments for gitarchive.get_test_runs();
            entries whose value is None are dropped
    """
    valid_kwargs = {k: v for k, v in kwargs.items() if v is not None}

    fields, revs = gitarchive.get_test_runs(log, repo, tag_name, **valid_kwargs)
    ignore_fields = ['tag_number']
    if verbosity < 2:
        extra_fields = ['COMMITS', 'TEST RUNS']
        ignore_fields.extend(['commit_number', 'commit'])
    else:
        extra_fields = ['TEST RUNS']

    # Indices (into 'fields' and into each rev) of the fields to print
    print_fields = [i for i, f in enumerate(fields) if f not in ignore_fields]

    # Header row
    rows = [[fields[i].upper() for i in print_fields] + extra_fields]

    prev = [''] * len(print_fields)
    prev_commit = None
    commit_cnt = 0
    commit_field = fields.index('commit')
    for rev in revs:
        # Only use fields that we want to print
        cols = [rev[i] for i in print_fields]

        if cols != prev:
            commit_cnt = 1
            test_run_cnt = 1
            new_row = [''] * (len(print_fields) + len(extra_fields))

            # Position of the first column that differs from the previous
            # row. 'cols' and 'prev' are indexed by position, not by the
            # field indices stored in 'print_fields', so scan positions
            # here. One always exists because cols != prev and both have
            # the same length.
            first_diff = next(pos for pos, (cur, old) in enumerate(zip(cols, prev))
                              if cur != old)
            new_row[first_diff:-len(extra_fields)] = cols[first_diff:]
            rows.append(new_row)
        else:
            if rev[commit_field] != prev_commit:
                commit_cnt += 1
            test_run_cnt += 1

        # new_row is the same list object that was appended to rows, so the
        # counters of the current table row are updated in place
        if verbosity < 2:
            new_row[-2] = commit_cnt
        new_row[-1] = test_run_cnt
        prev = cols
        prev_commit = rev[commit_field]

    print_table(rows)
|  | 95 |  | 
def is_xml_format(repo, commit):
    """Tell whether the results stored in a commit are in xml format

    Returns True when '<commit>:results.xml' resolves in the repository,
    otherwise False (the results are then assumed to be json formatted).
    """
    has_xml = bool(repo.rev_parse(commit + ':results.xml'))
    if has_xml:
        log.debug("Detected report in xml format in %s", commit)
    else:
        log.debug("No xml report in %s, assuming json formatted results", commit)
    return has_xml
|  | 104 |  | 
def read_results(repo, tags, xml=True):
    """Load metadata and results of the given tags from the repository

    All files are fetched with one 'git show' invocation: first the metadata
    file of every tag, then the results file of every tag. Returns a pair
    (list of metadata, list of results), each holding one entry per tag.
    """

    def parse_xml_stream(data):
        """Split a stream of concatenated XML documents and parse each"""
        docs = []
        pending = ""
        for line in data.splitlines():
            starts_new_doc = line.startswith('<?xml version=')
            if pending and starts_new_doc:
                # An XML declaration marks the beginning of the next document
                docs.append(ET.fromstring(pending))
                pending = line
            else:
                pending += line
        docs.append(ET.fromstring(pending))
        return docs

    def parse_json_stream(data):
        """Split a stream of concatenated JSON objects and parse each"""
        decoded = []
        pending = ""
        for line in data.splitlines():
            if line != '}{':
                pending += line
                continue
            # Boundary between two objects: close the current one and open
            # the next one
            pending += '}'
            decoded.append(json.loads(pending, object_pairs_hook=OrderedDict))
            pending = '{'
        decoded.append(json.loads(pending, object_pairs_hook=OrderedDict))
        return decoded

    num_revs = len(tags)

    # Optimize by reading all data with one git command
    log.debug("Loading raw result data from %d tags, %s...", num_revs, tags[0])
    if not xml:
        git_objs = ([tag + ':metadata.json' for tag in tags] +
                    [tag + ':results.json' for tag in tags])
        objs = parse_json_stream(repo.run_cmd(['show'] + git_objs + ['--']))
        return objs[0:num_revs], objs[num_revs:]

    git_objs = ([tag + ':metadata.xml' for tag in tags] +
                [tag + ':results.xml' for tag in tags])
    elems = parse_xml_stream(repo.run_cmd(['show'] + git_objs + ['--']))
    metadata = [metadata_xml_to_json(elem) for elem in elems[0:num_revs]]
    results = [results_xml_to_json(elem) for elem in elems[num_revs:]]
    return (metadata, results)
|  | 148 |  | 
|  | 149 |  | 
def get_data_item(data, key):
    """Look up a value in nested containers using a dot-separated key

    Each dot-separated component of 'key' is used as a subscript on the
    value found so far, e.g. 'a.b' returns data['a']['b'].
    """
    node = data
    for component in key.split('.'):
        node = node[component]
    return node
|  | 155 |  | 
|  | 156 |  | 
def metadata_diff(metadata_l, metadata_r):
    """Collect selected metadata values of two test reports side by side

    Returns an OrderedDict mapping a short key to a dict with 'title',
    'value_old' (taken from metadata_l) and 'value' (taken from metadata_r).
    Values that are not present in the metadata are reported as '(N/A)'.
    """
    # (title, key in the returned dict, dotted lookup key in the metadata)
    keys = [('Hostname', 'hostname', 'hostname'),
            ('Branch', 'branch', 'layers.meta.branch'),
            ('Commit number', 'commit_num', 'layers.meta.commit_count'),
            ('Commit', 'commit', 'layers.meta.commit'),
            ('Number of test runs', 'testrun_count', 'testrun_count')
           ]

    def _lookup(metadata, dotted_key):
        """Get one metadata value, falling back to a placeholder"""
        try:
            return get_data_item(metadata, dotted_key)
        except KeyError:
            return '(N/A)'

    metadata = OrderedDict()
    for title, key, key_json in keys:
        value_l = _lookup(metadata_l, key_json)
        value_r = _lookup(metadata_r, key_json)
        metadata[key] = {'title': title,
                         'value_old': value_l,
                         'value': value_r}
    return metadata
|  | 185 |  | 
|  | 186 |  | 
def print_diff_report(metadata_l, data_l, metadata_r, data_r):
    """Print a plain text comparison of two sets of test results

    A metadata table is printed first, followed by one section per test
    listing, for every measurement, the mean of the 'left' and 'right' data
    together with their absolute and relative difference. Tests and
    measurements present on one side only are marked with '+' (missing from
    the left data) or '-' (missing from the right data).
    """

    # First, print general metadata
    print("\nTEST METADATA:\n==============")
    meta_diff = metadata_diff(metadata_l, metadata_r)
    row_fmt = ['{:{wid}} ', '{:<{wid}}   ', '{:<{wid}}']
    rows = [['', 'CURRENT COMMIT', 'COMPARING WITH']]
    for key, val in meta_diff.items():
        current = val['value']
        previous = val['value_old']
        if key == 'commit':
            # Shorten commit hashes
            current = current[:20]
            previous = previous[:20]
        rows.append([val['title'] + ':', current, previous])
    print_table(rows, row_fmt)

    # Print test results
    print("\nTEST RESULTS:\n=============")

    tests = list(data_l['tests'].keys())
    # Append tests that are only present in 'right' set
    tests += [t for t in list(data_r['tests'].keys()) if t not in tests]

    # Prepare data to be printed
    rows = []
    row_fmt = ['{:8}', '{:{wid}}', '{:{wid}}', '  {:>{wid}}', ' {:{wid}} ', '{:{wid}}',
               '  {:>{wid}}', '  {:>{wid}}']
    num_cols = len(row_fmt)
    for test in tests:
        test_l = data_l['tests'][test] if test in data_l['tests'] else None
        test_r = data_r['tests'][test] if test in data_r['tests'] else None
        if test_l is None:
            pref = '+'
        elif test_r is None:
            pref = '-'
        else:
            pref = ' '
        descr = test_l['description'] if test_l else test_r['description']
        rows.append(["{} {}: {}".format(pref, test, descr)])

        # Generate the list of measurements
        meas_l = test_l['measurements'] if test_l else {}
        meas_r = test_r['measurements'] if test_r else {}
        measurements = list(meas_l.keys())
        measurements += [m for m in list(meas_r.keys()) if m not in measurements]

        for meas in measurements:
            in_left = meas in meas_l
            in_right = meas in meas_r
            stats_l = measurement_stats(meas_l[meas] if in_left else None, 'l.')
            stats_r = measurement_stats(meas_r[meas] if in_right else None, 'r.')
            # A measurement missing from the right data takes precedence
            if not in_right:
                m_pref = '-'
            elif not in_left:
                m_pref = '+'
            else:
                m_pref = ' '

            # Merge both sides; the 'l.'/'r.' prefixes keep their values apart
            stats = stats_l.copy()
            stats.update(stats_r)

            val_cls = stats['val_cls']
            mean_r = stats['r.mean']
            mean_l = stats['l.mean']
            absdiff = val_cls(mean_r - mean_l)
            reldiff = "{:+.1f} %".format(absdiff * 100 / mean_l)
            sign = '+' if mean_r > mean_l else ''
            absdiff = sign + str(absdiff)
            rows.append(['', m_pref, stats['name'] + ' ' + stats['quantity'],
                         str(mean_l), '->', str(mean_r),
                         absdiff, reldiff])
        # Empty row separating the tests
        rows.append([''] * num_cols)

    print_table(rows, row_fmt)

    print()
|  | 265 |  | 
|  | 266 |  | 
class BSSummary(object):
    """Summary of the differences between two buildstats

    Attributes:
        tasks: dict with the task 'count' of bs2 and its signed 'change'
            relative to bs1
        top_consumer: the five task diffs with the highest 'value2'
        top_decrease: the five task diffs with the lowest 'absdiff'
        top_increase: the five task diffs with the highest 'absdiff'
        ver_diff: OrderedDict mapping a section title to a list of
            (recipe name, version text) pairs; empty sections are left out
    """

    def __init__(self, bs1, bs2):
        task_delta = bs2.num_tasks - bs1.num_tasks
        self.tasks = {'count': bs2.num_tasks,
                      'change': '{:+d}'.format(task_delta)}
        self.top_consumer = self.top_decrease = self.top_increase = None
        self.ver_diff = OrderedDict()

        # Get top consumers of resources
        by_usage = sorted(diff_buildstats(bs1, bs2, 'cputime'),
                          key=attrgetter('value2'))
        self.top_consumer = by_usage[-5:]

        # Get biggest increase and decrease in resource usage. The usage
        # sorted list is re-sorted so that ties keep their relative order.
        by_change = sorted(by_usage, key=attrgetter('absdiff'))
        self.top_decrease = by_change[0:5]
        self.top_increase = by_change[-5:]

        # Compare recipe versions and prepare data for display
        ver_diff = BSVerDiff(bs1, bs2)
        if not ver_diff:
            return

        def evr_change(rec):
            return "{} → {}".format(rec.left.evr, rec.right.evr)

        def version_change(rec):
            return "{} → {}".format(rec.left.version, rec.right.version)

        # (section title, BSVerDiff attribute, text shown for a recipe)
        sections = (('New recipes', 'new', attrgetter('evr')),
                    ('Dropped recipes', 'dropped', attrgetter('evr')),
                    ('Epoch changed', 'echanged', evr_change),
                    ('Version changed', 'vchanged', version_change),
                    ('Revision changed', 'rchanged', evr_change))
        for title, attr, describe in sections:
            recipes = getattr(ver_diff, attr)
            if recipes:
                self.ver_diff[title] = [(n, describe(r)) for n, r in recipes.items()]
|  | 300 |  | 
|  | 301 |  | 
|  | 302 | def print_html_report(data, id_comp, buildstats): | 
| Brad Bishop | 6e60e8b | 2018-02-01 10:27:11 -0500 | [diff] [blame] | 303 | """Print report in html format""" | 
|  | 304 | # Handle metadata | 
| Brad Bishop | d7bf8c1 | 2018-02-25 22:55:05 -0500 | [diff] [blame] | 305 | metadata = metadata_diff(data[id_comp].metadata, data[-1].metadata) | 
| Brad Bishop | 6e60e8b | 2018-02-01 10:27:11 -0500 | [diff] [blame] | 306 |  | 
|  | 307 | # Generate list of tests | 
|  | 308 | tests = [] | 
| Brad Bishop | d7bf8c1 | 2018-02-25 22:55:05 -0500 | [diff] [blame] | 309 | for test in data[-1].results['tests'].keys(): | 
|  | 310 | test_r = data[-1].results['tests'][test] | 
| Brad Bishop | 6e60e8b | 2018-02-01 10:27:11 -0500 | [diff] [blame] | 311 | new_test = {'name': test_r['name'], | 
|  | 312 | 'description': test_r['description'], | 
|  | 313 | 'status': test_r['status'], | 
|  | 314 | 'measurements': [], | 
|  | 315 | 'err_type': test_r.get('err_type'), | 
|  | 316 | } | 
|  | 317 | # Limit length of err output shown | 
|  | 318 | if 'message' in test_r: | 
|  | 319 | lines = test_r['message'].splitlines() | 
|  | 320 | if len(lines) > 20: | 
|  | 321 | new_test['message'] = '...\n' + '\n'.join(lines[-20:]) | 
|  | 322 | else: | 
|  | 323 | new_test['message'] = test_r['message'] | 
|  | 324 |  | 
|  | 325 |  | 
|  | 326 | # Generate the list of measurements | 
|  | 327 | for meas in test_r['measurements'].keys(): | 
|  | 328 | meas_r = test_r['measurements'][meas] | 
|  | 329 | meas_type = 'time' if meas_r['type'] == 'sysres' else 'size' | 
|  | 330 | new_meas = {'name': meas_r['name'], | 
|  | 331 | 'legend': meas_r['legend'], | 
|  | 332 | 'description': meas_r['name'] + ' ' + meas_type, | 
|  | 333 | } | 
|  | 334 | samples = [] | 
|  | 335 |  | 
|  | 336 | # Run through all revisions in our data | 
|  | 337 | for meta, test_data in data: | 
|  | 338 | if (not test in test_data['tests'] or | 
|  | 339 | not meas in test_data['tests'][test]['measurements']): | 
|  | 340 | samples.append(measurement_stats(None)) | 
|  | 341 | continue | 
|  | 342 | test_i = test_data['tests'][test] | 
|  | 343 | meas_i = test_i['measurements'][meas] | 
|  | 344 | commit_num = get_data_item(meta, 'layers.meta.commit_count') | 
|  | 345 | samples.append(measurement_stats(meas_i)) | 
|  | 346 | samples[-1]['commit_num'] = commit_num | 
|  | 347 |  | 
|  | 348 | absdiff = samples[-1]['val_cls'](samples[-1]['mean'] - samples[id_comp]['mean']) | 
| Brad Bishop | 1a4b7ee | 2018-12-16 17:11:34 -0800 | [diff] [blame] | 349 | reldiff = absdiff * 100 / samples[id_comp]['mean'] | 
| Brad Bishop | 6e60e8b | 2018-02-01 10:27:11 -0500 | [diff] [blame] | 350 | new_meas['absdiff'] = absdiff | 
|  | 351 | new_meas['absdiff_str'] = str(absdiff) if absdiff < 0 else '+' + str(absdiff) | 
| Brad Bishop | 1a4b7ee | 2018-12-16 17:11:34 -0800 | [diff] [blame] | 352 | new_meas['reldiff'] = reldiff | 
|  | 353 | new_meas['reldiff_str'] = "{:+.1f} %".format(reldiff) | 
| Brad Bishop | 6e60e8b | 2018-02-01 10:27:11 -0500 | [diff] [blame] | 354 | new_meas['samples'] = samples | 
|  | 355 | new_meas['value'] = samples[-1] | 
|  | 356 | new_meas['value_type'] = samples[-1]['val_cls'] | 
|  | 357 |  | 
| Brad Bishop | d7bf8c1 | 2018-02-25 22:55:05 -0500 | [diff] [blame] | 358 | # Compare buildstats | 
|  | 359 | bs_key = test + '.' + meas | 
| Andrew Geissler | 99467da | 2019-02-25 18:54:23 -0600 | [diff] [blame] | 360 | rev = str(metadata['commit_num']['value']) | 
|  | 361 | comp_rev = str(metadata['commit_num']['value_old']) | 
| Brad Bishop | d7bf8c1 | 2018-02-25 22:55:05 -0500 | [diff] [blame] | 362 | if (rev in buildstats and bs_key in buildstats[rev] and | 
|  | 363 | comp_rev in buildstats and bs_key in buildstats[comp_rev]): | 
|  | 364 | new_meas['buildstats'] = BSSummary(buildstats[comp_rev][bs_key], | 
|  | 365 | buildstats[rev][bs_key]) | 
|  | 366 |  | 
|  | 367 |  | 
| Brad Bishop | 6e60e8b | 2018-02-01 10:27:11 -0500 | [diff] [blame] | 368 | new_test['measurements'].append(new_meas) | 
|  | 369 | tests.append(new_test) | 
|  | 370 |  | 
|  | 371 | # Chart options | 
|  | 372 | chart_opts = {'haxis': {'min': get_data_item(data[0][0], 'layers.meta.commit_count'), | 
|  | 373 | 'max': get_data_item(data[-1][0], 'layers.meta.commit_count')} | 
|  | 374 | } | 
|  | 375 |  | 
| Brad Bishop | d7bf8c1 | 2018-02-25 22:55:05 -0500 | [diff] [blame] | 376 | print(html.template.render(title="Build Perf Test Report", | 
|  | 377 | metadata=metadata, test_data=tests, | 
|  | 378 | chart_opts=chart_opts)) | 
|  | 379 |  | 
|  | 380 |  | 
def get_buildstats(repo, notes_ref, revs, outdir=None):
    """Read the buildstats of the given revisions from git notes

    Args:
        repo: repository object providing rev_parse() and run_cmd()
        notes_ref: notes ref name, without the 'refs/notes/' prefix
        revs: revisions to process; the 'commit_number', 'commit' and 'tags'
            attributes of each one are used
        outdir: when set, every buildstats object read is also written to
            '<outdir>/<measurement>/<tag base>/<run id>.json'

    Returns:
        A dict mapping each commit number to a dict of measurement name to
        buildstats aggregated over the tags of the revision, or None if the
        notes ref does not exist in the repository.
    """
    full_ref = 'refs/notes/' + notes_ref
    if not repo.rev_parse(full_ref):
        log.error("No buildstats found, please try running "
                  "'git fetch origin %s:%s' to fetch them from the remote",
                  full_ref, full_ref)
        return

    missing = False
    buildstats = {}
    log.info("Parsing buildstats from 'refs/notes/%s'", notes_ref)
    for rev in revs:
        rev_stats = buildstats[rev.commit_number] = {}
        log.debug('Dumping buildstats for %s (%s)', rev.commit_number,
                  rev.commit)
        for tag in rev.tags:
            log.debug('    %s', tag)
            try:
                bs_all = json.loads(repo.run_cmd(['notes', '--ref', notes_ref,
                                                  'show', tag + '^0']))
            except GitError:
                log.warning("Buildstats not found for %s", tag)
                bs_all = {}
                missing = True

            for measurement, bs in bs_all.items():
                # Write out onto disk
                if outdir:
                    # The last tag component names the file, the rest of
                    # the tag is flattened into a single directory name
                    tag_base, run_id = tag.rsplit('/', 1)
                    bs_dir = os.path.join(outdir, measurement,
                                          tag_base.replace('/', '_'))
                    if not os.path.exists(bs_dir):
                        os.makedirs(bs_dir)
                    bs_file = os.path.join(bs_dir, run_id + '.json')
                    with open(bs_file, 'w') as f:
                        json.dump(bs, f, indent=2)

                # Read buildstats into a dict, merging the test runs of a
                # revision
                _bs = BuildStats.from_json(bs)
                if measurement in rev_stats:
                    rev_stats[measurement].aggregate(_bs)
                else:
                    rev_stats[measurement] = _bs

    if missing:
        log.info("Buildstats were missing for some test runs, please "
                 "run 'git fetch origin %s:%s' and try again",
                 full_ref, full_ref)

    return buildstats
| Brad Bishop | 6e60e8b | 2018-02-01 10:27:11 -0500 | [diff] [blame] | 431 |  | 
|  | 432 |  | 
def auto_args(repo, args):
    """Fill in unset arguments from the latest commit of the repository

    The body of the most recent commit on any branch or remote is scanned
    for 'key: value' lines; 'hostname' and 'branch' values are stored in
    args unless the corresponding argument is already set.
    """
    # Get the latest commit in the repo
    log.debug("Guessing arguments from the latest commit")
    msg = repo.run_cmd(['log', '-1', '--branches', '--remotes', '--format=%b'])
    for line in msg.splitlines():
        key, colon, rest = line.partition(':')
        if not colon:
            # Not a 'key: value' line
            continue

        val = rest.strip()
        if key == 'hostname' and not args.hostname:
            log.debug("Using hostname %s", val)
            args.hostname = val
        elif key == 'branch' and not args.branch:
            log.debug("Using branch %s", val)
            args.branch = val
|  | 451 |  | 
|  | 452 |  | 
def parse_args(argv):
    """Build the command line parser and parse the given arguments

    Returns the argparse namespace holding the parsed options.
    """
    parser = argparse.ArgumentParser(
        description="\nExamine build performance test results from a Git repository",
        formatter_class=argparse.ArgumentDefaultsHelpFormatter)

    # General options
    opt = parser.add_argument
    opt('--debug', '-d', action='store_true', help="Verbose logging")
    opt('--repo', '-r', required=True,
        help="Results repository (local git clone)")
    opt('--list', '-l', action='count', help="List available test runs")
    opt('--html', action='store_true', help="Generate report in html format")

    # Options selecting which test results are examined
    rev_opt = parser.add_argument_group('Tag and revision').add_argument
    rev_opt('--tag-name', '-t',
            default='{hostname}/{branch}/{machine}/{commit_number}-g{commit}/{tag_number}',
            help="Tag name (pattern) for finding results")
    rev_opt('--hostname', '-H')
    rev_opt('--branch', '-B', default='master',
            help="Branch to find commit in")
    rev_opt('--branch2', help="Branch to find comparision revisions in")
    rev_opt('--machine', default='qemux86')
    rev_opt('--history-length', default=25, type=int,
            help="Number of tested revisions to plot in html report")
    rev_opt('--commit', help="Revision to search for")
    rev_opt('--commit-number',
            help="Revision number to search for, redundant if "
                 "--commit is specified")
    rev_opt('--commit2', help="Revision to compare with")
    rev_opt('--commit-number2',
            help="Revision number to compare with, redundant if "
                 "--commit2 is specified")

    opt('--dump-buildstats', nargs='?', const='.',
        help="Dump buildstats of the tests")

    return parser.parse_args(argv)
|  | 493 |  | 
|  | 494 |  | 
def main(argv=None):
    """Run the report tool

    Parses the command line, picks the two revisions to compare, loads
    their results from the repository and prints either a text or an html
    report. Returns 0 on success and 1 when the revisions to report on
    cannot be determined.
    """
    args = parse_args(argv)
    if args.debug:
        log.setLevel(logging.DEBUG)

    repo = GitRepo(args.repo)

    if args.list:
        list_test_revs(repo, args.tag_name, args.list, hostname=args.hostname)
        return 0

    # Determine hostname which to use
    if not args.hostname:
        auto_args(repo, args)

    revs = gitarchive.get_test_revs(log, repo, args.tag_name,
                                    hostname=args.hostname,
                                    branch=args.branch,
                                    machine=args.machine)
    if args.branch2:
        revs2 = gitarchive.get_test_revs(log, repo, args.tag_name,
                                         hostname=args.hostname,
                                         branch=args.branch2,
                                         machine=args.machine)
        if len(revs2) == 0:
            log.error("No revisions found to compare against")
            return 1
        if len(revs) == 0:
            log.error("No revision to report on found")
            return 1
    elif len(revs) < 2:
        log.error("Only %d tester revisions found, unable to generate report",
                  len(revs))
        return 1

    # Pick the revision to report on
    if args.commit:
        if args.commit_number:
            log.warning("Ignoring --commit-number as --commit was specified")
        index1 = gitarchive.rev_find(revs, 'commit', args.commit)
    elif args.commit_number:
        index1 = gitarchive.rev_find(revs, 'commit_number', args.commit_number)
    else:
        index1 = len(revs) - 1

    if args.branch2:
        # Search the comparison branch instead, with the revision to report
        # on appended as its last entry
        revs2.append(revs[index1])
        index1 = len(revs2) - 1
        revs = revs2

    # Pick the revision to compare with
    if args.commit2:
        if args.commit_number2:
            log.warning("Ignoring --commit-number2 as --commit2 was specified")
        index2 = gitarchive.rev_find(revs, 'commit', args.commit2)
    elif args.commit_number2:
        index2 = gitarchive.rev_find(revs, 'commit_number', args.commit_number2)
    elif index1 > 0:
        index2 = index1 - 1
        # Find the closest matching commit number for comparison.
        # In future we could check the commit is a common ancestor and
        # continue back if not, but this is good enough for now
        while index2 > 0 and revs[index2].commit_number > revs[index1].commit_number:
            index2 -= 1
    else:
        log.error("Unable to determine the other commit, use "
                  "--commit2 or --commit-number2 to specify it")
        return 1

    index_l = min(index1, index2)
    index_r = max(index1, index2)

    rev_l = revs[index_l]
    rev_r = revs[index_r]
    log.debug("Using 'left' revision %s (%s), %s test runs:\n    %s",
              rev_l.commit_number, rev_l.commit, len(rev_l.tags),
              '\n    '.join(rev_l.tags))
    log.debug("Using 'right' revision %s (%s), %s test runs:\n    %s",
              rev_r.commit_number, rev_r.commit, len(rev_r.tags),
              '\n    '.join(rev_r.tags))

    # Check report format used in the repo (assume all reports in the same fmt)
    xml = is_xml_format(repo, revs[index_r].tags[-1])

    if args.html:
        # The html report plots a history of revisions leading up to index_r
        index_0 = max(0, min(index_l, index_r - args.history_length))
        rev_range = range(index_0, index_r + 1)
    else:
        # We do not need range of commits for text report (no graphs)
        index_0 = index_l
        rev_range = (index_l, index_r)

    # Read raw data
    log.debug("Reading %d revisions, starting from %s (%s)",
              len(rev_range), revs[index_0].commit_number, revs[index_0].commit)
    raw_data = [read_results(repo, revs[i].tags, xml) for i in rev_range]

    data = [AggregateTestData(aggregate_metadata(raw_m), aggregate_data(raw_d))
            for raw_m, raw_d in raw_data]

    # Read buildstats only when needed
    buildstats = None
    if args.dump_buildstats or args.html:
        outdir = 'oe-build-perf-buildstats' if args.dump_buildstats else None
        notes_ref = 'buildstats/{}/{}/{}'.format(args.hostname, args.branch,
                                                 args.machine)
        buildstats = get_buildstats(repo, notes_ref, [rev_l, rev_r], outdir)

    # Print report
    if args.html:
        # Re-map 'left' list index to the data table where index_0 maps to 0
        print_html_report(data, index_l - index_0, buildstats)
    else:
        print_diff_report(data[0].metadata, data[0].results,
                          data[1].metadata, data[1].results)

    return 0
|  | 611 |  | 
# Run main() only when executed as a script; its return value becomes the
# exit status of the process
if __name__ == "__main__":
    sys.exit(main())