| Patrick Williams | c0f7c04 | 2017-02-23 20:41:17 -0600 | [diff] [blame] | 1 | #!/usr/bin/python3 | 
 | 2 | # | 
 | 3 | # Script for comparing buildstats from two different builds | 
 | 4 | # | 
 | 5 | # Copyright (c) 2016, Intel Corporation. | 
 | 6 | # | 
| Brad Bishop | c342db3 | 2019-05-15 21:57:59 -0400 | [diff] [blame] | 7 | # SPDX-License-Identifier: GPL-2.0-only | 
| Patrick Williams | c0f7c04 | 2017-02-23 20:41:17 -0600 | [diff] [blame] | 8 | # | 
| Brad Bishop | c342db3 | 2019-05-15 21:57:59 -0400 | [diff] [blame] | 9 |  | 
| Patrick Williams | c0f7c04 | 2017-02-23 20:41:17 -0600 | [diff] [blame] | 10 | import argparse | 
 | 11 | import glob | 
| Patrick Williams | c0f7c04 | 2017-02-23 20:41:17 -0600 | [diff] [blame] | 12 | import logging | 
 | 13 | import math | 
 | 14 | import os | 
| Patrick Williams | c0f7c04 | 2017-02-23 20:41:17 -0600 | [diff] [blame] | 15 | import sys | 
| Patrick Williams | c0f7c04 | 2017-02-23 20:41:17 -0600 | [diff] [blame] | 16 | from operator import attrgetter | 
 | 17 |  | 
| Brad Bishop | d7bf8c1 | 2018-02-25 22:55:05 -0500 | [diff] [blame] | 18 | # Import oe libs | 
 | 19 | scripts_path = os.path.dirname(os.path.realpath(__file__)) | 
 | 20 | sys.path.append(os.path.join(scripts_path, 'lib')) | 
 | 21 | from buildstats import BuildStats, diff_buildstats, taskdiff_fields, BSVerDiff | 
 | 22 |  | 
 | 23 |  | 
| Patrick Williams | c0f7c04 | 2017-02-23 20:41:17 -0600 | [diff] [blame] | 24 | # Setup logging | 
 | 25 | logging.basicConfig(level=logging.INFO, format="%(levelname)s: %(message)s") | 
 | 26 | log = logging.getLogger() | 
 | 27 |  | 
 | 28 |  | 
 | 29 | class ScriptError(Exception): | 
 | 30 |     """Exception for internal error handling of this script""" | 
 | 31 |     pass | 
 | 32 |  | 
 | 33 |  | 
| Patrick Williams | c0f7c04 | 2017-02-23 20:41:17 -0600 | [diff] [blame] | 34 | def read_buildstats(path, multi): | 
 | 35 |     """Read buildstats""" | 
 | 36 |     if not os.path.exists(path): | 
 | 37 |         raise ScriptError("No such file or directory: {}".format(path)) | 
 | 38 |  | 
 | 39 |     if os.path.isfile(path): | 
| Brad Bishop | d7bf8c1 | 2018-02-25 22:55:05 -0500 | [diff] [blame] | 40 |         return BuildStats.from_file_json(path) | 
| Patrick Williams | c0f7c04 | 2017-02-23 20:41:17 -0600 | [diff] [blame] | 41 |  | 
 | 42 |     if os.path.isfile(os.path.join(path, 'build_stats')): | 
| Brad Bishop | d7bf8c1 | 2018-02-25 22:55:05 -0500 | [diff] [blame] | 43 |         return BuildStats.from_dir(path) | 
| Patrick Williams | c0f7c04 | 2017-02-23 20:41:17 -0600 | [diff] [blame] | 44 |  | 
 | 45 |     # Handle a non-buildstat directory | 
 | 46 |     subpaths = sorted(glob.glob(path + '/*')) | 
 | 47 |     if len(subpaths) > 1: | 
 | 48 |         if multi: | 
 | 49 |             log.info("Averaging over {} buildstats from {}".format( | 
 | 50 |                      len(subpaths), path)) | 
 | 51 |         else: | 
 | 52 |             raise ScriptError("Multiple buildstats found in '{}'. Please give " | 
 | 53 |                               "a single buildstat directory of use the --multi " | 
 | 54 |                               "option".format(path)) | 
 | 55 |     bs = None | 
 | 56 |     for subpath in subpaths: | 
 | 57 |         if os.path.isfile(subpath): | 
| Brad Bishop | d7bf8c1 | 2018-02-25 22:55:05 -0500 | [diff] [blame] | 58 |             _bs = BuildStats.from_file_json(subpath) | 
| Patrick Williams | c0f7c04 | 2017-02-23 20:41:17 -0600 | [diff] [blame] | 59 |         else: | 
| Brad Bishop | d7bf8c1 | 2018-02-25 22:55:05 -0500 | [diff] [blame] | 60 |             _bs = BuildStats.from_dir(subpath) | 
 | 61 |         if bs is None: | 
 | 62 |             bs = _bs | 
| Patrick Williams | c0f7c04 | 2017-02-23 20:41:17 -0600 | [diff] [blame] | 63 |         else: | 
| Brad Bishop | d7bf8c1 | 2018-02-25 22:55:05 -0500 | [diff] [blame] | 64 |             bs.aggregate(_bs) | 
| Patrick Williams | c0f7c04 | 2017-02-23 20:41:17 -0600 | [diff] [blame] | 65 |     if not bs: | 
 | 66 |         raise ScriptError("No buildstats found under {}".format(path)) | 
| Brad Bishop | d7bf8c1 | 2018-02-25 22:55:05 -0500 | [diff] [blame] | 67 |  | 
| Patrick Williams | c0f7c04 | 2017-02-23 20:41:17 -0600 | [diff] [blame] | 68 |     return bs | 
 | 69 |  | 
 | 70 |  | 
 | 71 | def print_ver_diff(bs1, bs2): | 
 | 72 |     """Print package version differences""" | 
| Patrick Williams | c0f7c04 | 2017-02-23 20:41:17 -0600 | [diff] [blame] | 73 |  | 
| Brad Bishop | d7bf8c1 | 2018-02-25 22:55:05 -0500 | [diff] [blame] | 74 |     diff = BSVerDiff(bs1, bs2) | 
| Patrick Williams | c0f7c04 | 2017-02-23 20:41:17 -0600 | [diff] [blame] | 75 |  | 
| Brad Bishop | d7bf8c1 | 2018-02-25 22:55:05 -0500 | [diff] [blame] | 76 |     maxlen = max([len(r) for r in set(bs1.keys()).union(set(bs2.keys()))]) | 
| Patrick Williams | c0f7c04 | 2017-02-23 20:41:17 -0600 | [diff] [blame] | 77 |     fmt_str = "  {:{maxlen}} ({})" | 
| Patrick Williams | c0f7c04 | 2017-02-23 20:41:17 -0600 | [diff] [blame] | 78 |  | 
| Brad Bishop | d7bf8c1 | 2018-02-25 22:55:05 -0500 | [diff] [blame] | 79 |     if diff.new: | 
 | 80 |         print("\nNEW RECIPES:") | 
 | 81 |         print("------------") | 
 | 82 |         for name, val in sorted(diff.new.items()): | 
 | 83 |             print(fmt_str.format(name, val.nevr, maxlen=maxlen)) | 
| Patrick Williams | c0f7c04 | 2017-02-23 20:41:17 -0600 | [diff] [blame] | 84 |  | 
| Brad Bishop | d7bf8c1 | 2018-02-25 22:55:05 -0500 | [diff] [blame] | 85 |     if diff.dropped: | 
 | 86 |         print("\nDROPPED RECIPES:") | 
 | 87 |         print("----------------") | 
 | 88 |         for name, val in sorted(diff.dropped.items()): | 
 | 89 |             print(fmt_str.format(name, val.nevr, maxlen=maxlen)) | 
| Patrick Williams | c0f7c04 | 2017-02-23 20:41:17 -0600 | [diff] [blame] | 90 |  | 
 | 91 |     fmt_str = "  {0:{maxlen}} {1:<20}    ({2})" | 
| Brad Bishop | d7bf8c1 | 2018-02-25 22:55:05 -0500 | [diff] [blame] | 92 |     if diff.rchanged: | 
| Patrick Williams | c0f7c04 | 2017-02-23 20:41:17 -0600 | [diff] [blame] | 93 |         print("\nREVISION CHANGED:") | 
 | 94 |         print("-----------------") | 
| Brad Bishop | d7bf8c1 | 2018-02-25 22:55:05 -0500 | [diff] [blame] | 95 |         for name, val in sorted(diff.rchanged.items()): | 
 | 96 |             field1 = "{} -> {}".format(val.left.revision, val.right.revision) | 
 | 97 |             field2 = "{} -> {}".format(val.left.nevr, val.right.nevr) | 
 | 98 |             print(fmt_str.format(name, field1, field2, maxlen=maxlen)) | 
| Patrick Williams | c0f7c04 | 2017-02-23 20:41:17 -0600 | [diff] [blame] | 99 |  | 
| Brad Bishop | d7bf8c1 | 2018-02-25 22:55:05 -0500 | [diff] [blame] | 100 |     if diff.vchanged: | 
| Patrick Williams | c0f7c04 | 2017-02-23 20:41:17 -0600 | [diff] [blame] | 101 |         print("\nVERSION CHANGED:") | 
 | 102 |         print("----------------") | 
| Brad Bishop | d7bf8c1 | 2018-02-25 22:55:05 -0500 | [diff] [blame] | 103 |         for name, val in sorted(diff.vchanged.items()): | 
 | 104 |             field1 = "{} -> {}".format(val.left.version, val.right.version) | 
 | 105 |             field2 = "{} -> {}".format(val.left.nevr, val.right.nevr) | 
 | 106 |             print(fmt_str.format(name, field1, field2, maxlen=maxlen)) | 
| Patrick Williams | c0f7c04 | 2017-02-23 20:41:17 -0600 | [diff] [blame] | 107 |  | 
| Brad Bishop | d7bf8c1 | 2018-02-25 22:55:05 -0500 | [diff] [blame] | 108 |     if diff.echanged: | 
| Patrick Williams | c0f7c04 | 2017-02-23 20:41:17 -0600 | [diff] [blame] | 109 |         print("\nEPOCH CHANGED:") | 
 | 110 |         print("--------------") | 
| Brad Bishop | d7bf8c1 | 2018-02-25 22:55:05 -0500 | [diff] [blame] | 111 |         for name, val in sorted(diff.echanged.items()): | 
 | 112 |             field1 = "{} -> {}".format(val.left.epoch, val.right.epoch) | 
 | 113 |             field2 = "{} -> {}".format(val.left.nevr, val.right.nevr) | 
 | 114 |             print(fmt_str.format(name, field1, field2, maxlen=maxlen)) | 
| Patrick Williams | c0f7c04 | 2017-02-23 20:41:17 -0600 | [diff] [blame] | 115 |  | 
 | 116 |  | 
| Brad Bishop | 96ff198 | 2019-08-19 13:50:42 -0400 | [diff] [blame] | 117 | def print_task_diff(bs1, bs2, val_type, min_val=0, min_absdiff=0, sort_by=('absdiff',), only_tasks=[]): | 
| Patrick Williams | c0f7c04 | 2017-02-23 20:41:17 -0600 | [diff] [blame] | 118 |     """Diff task execution times""" | 
 | 119 |     def val_to_str(val, human_readable=False): | 
 | 120 |         """Convert raw value to printable string""" | 
 | 121 |         def hms_time(secs): | 
 | 122 |             """Get time in human-readable HH:MM:SS format""" | 
 | 123 |             h = int(secs / 3600) | 
 | 124 |             m = int((secs % 3600) / 60) | 
 | 125 |             s = secs % 60 | 
 | 126 |             if h == 0: | 
 | 127 |                 return "{:02d}:{:04.1f}".format(m, s) | 
 | 128 |             else: | 
 | 129 |                 return "{:d}:{:02d}:{:04.1f}".format(h, m, s) | 
 | 130 |  | 
 | 131 |         if 'time' in val_type: | 
 | 132 |             if human_readable: | 
 | 133 |                 return hms_time(val) | 
 | 134 |             else: | 
 | 135 |                 return "{:.1f}s".format(val) | 
 | 136 |         elif 'bytes' in val_type and human_readable: | 
 | 137 |                 prefix = ['', 'Ki', 'Mi', 'Gi', 'Ti', 'Pi'] | 
 | 138 |                 dec = int(math.log(val, 2) / 10) | 
 | 139 |                 prec = 1 if dec > 0 else 0 | 
 | 140 |                 return "{:.{prec}f}{}B".format(val / (2 ** (10 * dec)), | 
 | 141 |                                                prefix[dec], prec=prec) | 
 | 142 |         elif 'ops' in val_type and human_readable: | 
 | 143 |                 prefix = ['', 'k', 'M', 'G', 'T', 'P'] | 
 | 144 |                 dec = int(math.log(val, 1000)) | 
 | 145 |                 prec = 1 if dec > 0 else 0 | 
 | 146 |                 return "{:.{prec}f}{}ops".format(val / (1000 ** dec), | 
 | 147 |                                                  prefix[dec], prec=prec) | 
 | 148 |         return str(int(val)) | 
 | 149 |  | 
 | 150 |     def sum_vals(buildstats): | 
 | 151 |         """Get cumulative sum of all tasks""" | 
 | 152 |         total = 0.0 | 
 | 153 |         for recipe_data in buildstats.values(): | 
| Brad Bishop | 96ff198 | 2019-08-19 13:50:42 -0400 | [diff] [blame] | 154 |             for name, bs_task in recipe_data.tasks.items(): | 
 | 155 |                 if not only_tasks or name in only_tasks: | 
 | 156 |                     total += getattr(bs_task, val_type) | 
| Patrick Williams | c0f7c04 | 2017-02-23 20:41:17 -0600 | [diff] [blame] | 157 |         return total | 
 | 158 |  | 
| Patrick Williams | c0f7c04 | 2017-02-23 20:41:17 -0600 | [diff] [blame] | 159 |     if min_val: | 
 | 160 |         print("Ignoring tasks less than {} ({})".format( | 
 | 161 |                 val_to_str(min_val, True), val_to_str(min_val))) | 
 | 162 |     if min_absdiff: | 
 | 163 |         print("Ignoring differences less than {} ({})".format( | 
 | 164 |                 val_to_str(min_absdiff, True), val_to_str(min_absdiff))) | 
 | 165 |  | 
 | 166 |     # Prepare the data | 
| Brad Bishop | 96ff198 | 2019-08-19 13:50:42 -0400 | [diff] [blame] | 167 |     tasks_diff = diff_buildstats(bs1, bs2, val_type, min_val, min_absdiff, only_tasks) | 
| Patrick Williams | c0f7c04 | 2017-02-23 20:41:17 -0600 | [diff] [blame] | 168 |  | 
 | 169 |     # Sort our list | 
 | 170 |     for field in reversed(sort_by): | 
 | 171 |         if field.startswith('-'): | 
 | 172 |             field = field[1:] | 
 | 173 |             reverse = True | 
 | 174 |         else: | 
 | 175 |             reverse = False | 
 | 176 |         tasks_diff = sorted(tasks_diff, key=attrgetter(field), reverse=reverse) | 
 | 177 |  | 
 | 178 |     linedata = [('  ', 'PKG', '  ', 'TASK', 'ABSDIFF', 'RELDIFF', | 
 | 179 |                 val_type.upper() + '1', val_type.upper() + '2')] | 
 | 180 |     field_lens = dict([('len_{}'.format(i), len(f)) for i, f in enumerate(linedata[0])]) | 
 | 181 |  | 
 | 182 |     # Prepare fields in string format and measure field lengths | 
 | 183 |     for diff in tasks_diff: | 
 | 184 |         task_prefix = diff.task_op if diff.pkg_op == '  ' else '  ' | 
 | 185 |         linedata.append((diff.pkg_op, diff.pkg, task_prefix, diff.task, | 
 | 186 |                          val_to_str(diff.absdiff), | 
 | 187 |                          '{:+.1f}%'.format(diff.reldiff), | 
 | 188 |                          val_to_str(diff.value1), | 
 | 189 |                          val_to_str(diff.value2))) | 
 | 190 |         for i, field in enumerate(linedata[-1]): | 
 | 191 |             key = 'len_{}'.format(i) | 
 | 192 |             if len(field) > field_lens[key]: | 
 | 193 |                 field_lens[key] = len(field) | 
 | 194 |  | 
 | 195 |     # Print data | 
 | 196 |     print() | 
 | 197 |     for fields in linedata: | 
 | 198 |         print("{:{len_0}}{:{len_1}}  {:{len_2}}{:{len_3}}  {:>{len_4}}  {:>{len_5}}  {:>{len_6}} -> {:{len_7}}".format( | 
 | 199 |                 *fields, **field_lens)) | 
 | 200 |  | 
 | 201 |     # Print summary of the diffs | 
 | 202 |     total1 = sum_vals(bs1) | 
 | 203 |     total2 = sum_vals(bs2) | 
 | 204 |     print("\nCumulative {}:".format(val_type)) | 
 | 205 |     print ("  {}    {:+.1f}%    {} ({}) -> {} ({})".format( | 
 | 206 |                 val_to_str(total2 - total1), 100 * (total2-total1) / total1, | 
 | 207 |                 val_to_str(total1, True), val_to_str(total1), | 
 | 208 |                 val_to_str(total2, True), val_to_str(total2))) | 
 | 209 |  | 
 | 210 |  | 
 | 211 | def parse_args(argv): | 
 | 212 |     """Parse cmdline arguments""" | 
 | 213 |     description=""" | 
 | 214 | Script for comparing buildstats of two separate builds.""" | 
 | 215 |     parser = argparse.ArgumentParser( | 
 | 216 |             formatter_class=argparse.ArgumentDefaultsHelpFormatter, | 
 | 217 |             description=description) | 
 | 218 |  | 
 | 219 |     min_val_defaults = {'cputime': 3.0, | 
 | 220 |                         'read_bytes': 524288, | 
 | 221 |                         'write_bytes': 524288, | 
 | 222 |                         'read_ops': 500, | 
 | 223 |                         'write_ops': 500, | 
 | 224 |                         'walltime': 5} | 
 | 225 |     min_absdiff_defaults = {'cputime': 1.0, | 
 | 226 |                             'read_bytes': 131072, | 
 | 227 |                             'write_bytes': 131072, | 
 | 228 |                             'read_ops': 50, | 
 | 229 |                             'write_ops': 50, | 
 | 230 |                             'walltime': 2} | 
 | 231 |  | 
 | 232 |     parser.add_argument('--debug', '-d', action='store_true', | 
 | 233 |                         help="Verbose logging") | 
 | 234 |     parser.add_argument('--ver-diff', action='store_true', | 
 | 235 |                         help="Show package version differences and exit") | 
 | 236 |     parser.add_argument('--diff-attr', default='cputime', | 
 | 237 |                         choices=min_val_defaults.keys(), | 
 | 238 |                         help="Buildstat attribute which to compare") | 
 | 239 |     parser.add_argument('--min-val', default=min_val_defaults, type=float, | 
 | 240 |                         help="Filter out tasks less than MIN_VAL. " | 
 | 241 |                              "Default depends on --diff-attr.") | 
 | 242 |     parser.add_argument('--min-absdiff', default=min_absdiff_defaults, type=float, | 
 | 243 |                         help="Filter out tasks whose difference is less than " | 
 | 244 |                              "MIN_ABSDIFF, Default depends on --diff-attr.") | 
 | 245 |     parser.add_argument('--sort-by', default='absdiff', | 
 | 246 |                         help="Comma-separated list of field sort order. " | 
 | 247 |                              "Prepend the field name with '-' for reversed sort. " | 
 | 248 |                              "Available fields are: {}".format(', '.join(taskdiff_fields))) | 
 | 249 |     parser.add_argument('--multi', action='store_true', | 
 | 250 |                         help="Read all buildstats from the given paths and " | 
 | 251 |                              "average over them") | 
| Brad Bishop | 96ff198 | 2019-08-19 13:50:42 -0400 | [diff] [blame] | 252 |     parser.add_argument('--only-task', dest='only_tasks', metavar='TASK', action='append', default=[], | 
 | 253 |                         help="Only include TASK in report. May be specified multiple times") | 
| Patrick Williams | c0f7c04 | 2017-02-23 20:41:17 -0600 | [diff] [blame] | 254 |     parser.add_argument('buildstats1', metavar='BUILDSTATS1', help="'Left' buildstat") | 
 | 255 |     parser.add_argument('buildstats2', metavar='BUILDSTATS2', help="'Right' buildstat") | 
 | 256 |  | 
 | 257 |     args = parser.parse_args(argv) | 
 | 258 |  | 
 | 259 |     # We do not nedd/want to read all buildstats if we just want to look at the | 
 | 260 |     # package versions | 
 | 261 |     if args.ver_diff: | 
 | 262 |         args.multi = False | 
 | 263 |  | 
 | 264 |     # Handle defaults for the filter arguments | 
 | 265 |     if args.min_val is min_val_defaults: | 
 | 266 |         args.min_val = min_val_defaults[args.diff_attr] | 
 | 267 |     if args.min_absdiff is min_absdiff_defaults: | 
 | 268 |         args.min_absdiff = min_absdiff_defaults[args.diff_attr] | 
 | 269 |  | 
 | 270 |     return args | 
 | 271 |  | 
| Patrick Williams | c0f7c04 | 2017-02-23 20:41:17 -0600 | [diff] [blame] | 272 | def main(argv=None): | 
 | 273 |     """Script entry point""" | 
 | 274 |     args = parse_args(argv) | 
 | 275 |     if args.debug: | 
 | 276 |         log.setLevel(logging.DEBUG) | 
 | 277 |  | 
 | 278 |     # Validate sort fields | 
 | 279 |     sort_by = [] | 
 | 280 |     for field in args.sort_by.split(','): | 
 | 281 |         if field.lstrip('-') not in taskdiff_fields: | 
 | 282 |             log.error("Invalid sort field '%s' (must be one of: %s)" % | 
 | 283 |                       (field, ', '.join(taskdiff_fields))) | 
 | 284 |             sys.exit(1) | 
 | 285 |         sort_by.append(field) | 
 | 286 |  | 
 | 287 |     try: | 
 | 288 |         bs1 = read_buildstats(args.buildstats1, args.multi) | 
 | 289 |         bs2 = read_buildstats(args.buildstats2, args.multi) | 
 | 290 |  | 
 | 291 |         if args.ver_diff: | 
 | 292 |             print_ver_diff(bs1, bs2) | 
 | 293 |         else: | 
 | 294 |             print_task_diff(bs1, bs2, args.diff_attr, args.min_val, | 
| Brad Bishop | 96ff198 | 2019-08-19 13:50:42 -0400 | [diff] [blame] | 295 |                             args.min_absdiff, sort_by, args.only_tasks) | 
| Patrick Williams | c0f7c04 | 2017-02-23 20:41:17 -0600 | [diff] [blame] | 296 |     except ScriptError as err: | 
 | 297 |         log.error(str(err)) | 
 | 298 |         return 1 | 
 | 299 |     return 0 | 
 | 300 |  | 
 | 301 | if __name__ == "__main__": | 
 | 302 |     sys.exit(main()) |