blob: 10e7d13841a72dc93365507e27e172be334fc289 [file] [log] [blame]
Brad Bishop40320b12019-03-26 16:08:25 -04001# resulttool - regression analysis
2#
3# Copyright (c) 2019, Intel Corporation.
4# Copyright (c) 2019, Linux Foundation
5#
Brad Bishopc342db32019-05-15 21:57:59 -04006# SPDX-License-Identifier: GPL-2.0-only
Brad Bishop40320b12019-03-26 16:08:25 -04007#
Brad Bishopc342db32019-05-15 21:57:59 -04008
Brad Bishop40320b12019-03-26 16:08:25 -04009import resulttool.resultutils as resultutils
Brad Bishop40320b12019-03-26 16:08:25 -040010
11from oeqa.utils.git import GitRepo
12import oeqa.utils.gitarchive as gitarchive
13
# Maps a result's TEST_TYPE to the configuration key whose value must match
# between base and target for the two results to be comparable
# (see metadata_matches()).
METADATA_MATCH_TABLE = {
    "oeselftest": "OESELFTEST_METADATA"
}

# Known oe-selftest invocation profiles, mirroring the autobuilder's
# config.json. guess_oeselftest_metadata() uses these to reconstruct
# OESELFTEST_METADATA for older results stored without it.
OESELFTEST_METADATA_GUESS_TABLE={
    "trigger-build-posttrigger": {
        "run_all_tests": False,
        "run_tests":["buildoptions.SourceMirroring.test_yocto_source_mirror"],
        "skips": None,
        "machine": None,
        "select_tags":None,
        "exclude_tags": None
    },
    "reproducible": {
        "run_all_tests": False,
        "run_tests":["reproducible"],
        "skips": None,
        "machine": None,
        "select_tags":None,
        "exclude_tags": None
    },
    "arch-qemu-quick": {
        "run_all_tests": True,
        "run_tests":None,
        "skips": None,
        "machine": None,
        "select_tags":["machine"],
        "exclude_tags": None
    },
    "arch-qemu-full-x86-or-x86_64": {
        "run_all_tests": True,
        "run_tests":None,
        "skips": None,
        "machine": None,
        "select_tags":["machine", "toolchain-system"],
        "exclude_tags": None
    },
    "arch-qemu-full-others": {
        "run_all_tests": True,
        "run_tests":None,
        "skips": None,
        "machine": None,
        "select_tags":["machine", "toolchain-user"],
        "exclude_tags": None
    },
    "selftest": {
        "run_all_tests": True,
        "run_tests":None,
        "skips": ["distrodata.Distrodata.test_checkpkg", "buildoptions.SourceMirroring.test_yocto_source_mirror", "reproducible"],
        "machine": None,
        "select_tags":None,
        "exclude_tags": ["machine", "toolchain-system", "toolchain-user"]
    },
    "bringup": {
        "run_all_tests": True,
        "run_tests":None,
        "skips": ["distrodata.Distrodata.test_checkpkg", "buildoptions.SourceMirroring.test_yocto_source_mirror"],
        "machine": None,
        "select_tags":None,
        "exclude_tags": ["machine", "toolchain-system", "toolchain-user"]
    }
}

# Display replacements for raw status values (see get_status_str()).
STATUS_STRINGS = {
    "None": "No matching test result"
}

# Default cap on the number of regression lines printed per test family
# in compare_result(); overridable via the -l/--limit command line option.
REGRESSIONS_DISPLAY_LIMIT=50

# Section banners for the report printed by regression_common().
MISSING_TESTS_BANNER = "-------------------------- Missing tests --------------------------"
ADDITIONAL_DATA_BANNER = "--------------------- Matches and improvements --------------------"
85
Andrew Geissler6aa7eec2023-03-03 12:41:14 -060086def test_has_at_least_one_matching_tag(test, tag_list):
87 return "oetags" in test and any(oetag in tag_list for oetag in test["oetags"])
88
def all_tests_have_at_least_one_matching_tag(results, tag_list):
    """Return True when every non-ptest result carries at least one tag from tag_list (ptestresult.* entries are exempt)."""
    for test_name, test_result in results.items():
        if test_name.startswith("ptestresult"):
            continue
        if not test_has_at_least_one_matching_tag(test_result, tag_list):
            return False
    return True
91
def any_test_have_any_matching_tag(results, tag_list):
    """Return True when at least one result in *results* carries one of the tags in tag_list."""
    for test_result in results.values():
        if test_has_at_least_one_matching_tag(test_result, tag_list):
            return True
    return False
94
def have_skipped_test(result, test_prefix):
    """Return True when every test whose name starts with test_prefix is SKIPPED (vacuously True when none match)."""
    statuses = (data['status'] for name, data in result.items() if name.startswith(test_prefix))
    return all(status == "SKIPPED" for status in statuses)
97
def have_all_tests_skipped(result, test_prefixes_list):
    """Return True when, for every prefix in test_prefixes_list, all matching tests were skipped."""
    for prefix in test_prefixes_list:
        if not have_skipped_test(result, prefix):
            return False
    return True
100
def guess_oeselftest_metadata(results):
    """
    When an oeselftest test result is lacking OESELFTEST_METADATA, try to infer
    it from the content of the results: the number and names of executed tests,
    the presence/absence of oetags, and which tests were skipped. When the shape
    matches a known autobuilder invocation profile, return the corresponding
    entry of OESELFTEST_METADATA_GUESS_TABLE, otherwise None.
    This guessing process is tightly coupled to config.json in autobuilder. It
    should trigger less and less, as new tests will have OESELFTEST_METADATA
    properly appended at test reporting time.
    """
    # A lone source-mirror test is the post-trigger build check
    if len(results) == 1 and "buildoptions.SourceMirroring.test_yocto_source_mirror" in results:
        return OESELFTEST_METADATA_GUESS_TABLE['trigger-build-posttrigger']

    # Nothing but reproducible.* tests: the reproducible-builds run
    if all(name.startswith("reproducible") for name in results):
        return OESELFTEST_METADATA_GUESS_TABLE['reproducible']

    # Tag-selected runs, checked from the most restrictive tag set upwards;
    # keep this order, as each later tag set is a superset of the previous one
    tag_profiles = (
        ('arch-qemu-quick', ["machine"]),
        ('arch-qemu-full-x86-or-x86_64', ["machine", "toolchain-system"]),
        ('arch-qemu-full-others', ["machine", "toolchain-user"]),
    )
    for profile, tags in tag_profiles:
        if all_tests_have_at_least_one_matching_tag(results, tags):
            return OESELFTEST_METADATA_GUESS_TABLE[profile]

    # Untagged runs: tell "selftest" and "bringup" apart by which tests were skipped
    if not any_test_have_any_matching_tag(results, ["machine", "toolchain-user", "toolchain-system"]):
        if have_all_tests_skipped(results, ["distrodata.Distrodata.test_checkpkg", "buildoptions.SourceMirroring.test_yocto_source_mirror", "reproducible"]):
            return OESELFTEST_METADATA_GUESS_TABLE['selftest']
        if have_all_tests_skipped(results, ["distrodata.Distrodata.test_checkpkg", "buildoptions.SourceMirroring.test_yocto_source_mirror"]):
            return OESELFTEST_METADATA_GUESS_TABLE['bringup']

    return None
128
129
def metadata_matches(base_configuration, target_configuration):
    """
    For passed base and target, check test type. If test type matches one of
    properties described in METADATA_MATCH_TABLE, compare metadata if it is
    present in base. Return true if metadata matches, or if base lacks some
    data (either TEST_TYPE or the corresponding metadata)
    """
    metadata_key = METADATA_MATCH_TABLE.get(base_configuration.get('TEST_TYPE'))
    if metadata_key is None:
        # Unknown or absent test type: nothing further to compare on
        return True
    return base_configuration.get(metadata_key) == target_configuration.get(metadata_key)
146
147
def machine_matches(base_configuration, target_configuration):
    """Return True when base and target ran on the same MACHINE (both absent counts as a match)."""
    base_machine = base_configuration.get('MACHINE')
    target_machine = target_configuration.get('MACHINE')
    return base_machine == target_machine
150
151
def _enrich_with_guessed_oeselftest_metadata(logger, test_data):
    """Backfill OESELFTEST_METADATA on an oeselftest result that lacks it.

    Older test results lack proper OESELFTEST_METADATA: if not present, try to
    guess it based on the test results content (guess_oeselftest_metadata).
    Mutates test_data['configuration'] in place when a guess is found; logs an
    error when no known profile matches.
    """
    configuration = test_data['configuration']
    if configuration.get('TEST_TYPE') != 'oeselftest' or 'OESELFTEST_METADATA' in configuration:
        return
    guess = guess_oeselftest_metadata(test_data['result'])
    if guess is None:
        logger.error(f"ERROR: did not manage to guess oeselftest metadata for {configuration['STARTTIME']}")
    else:
        logger.debug(f"Enriching {configuration['STARTTIME']} with {guess}")
        configuration['OESELFTEST_METADATA'] = guess

def can_be_compared(logger, base, target):
    """
    Some tests are not relevant to be compared, for example some oeselftest
    run with different tests sets or parameters. Return true if tests can be
    compared
    """
    ret = True
    base_configuration = base['configuration']
    target_configuration = target['configuration']

    # Both sides get the same OESELFTEST_METADATA backfill treatment
    # (previously duplicated inline for base and target).
    _enrich_with_guessed_oeselftest_metadata(logger, base)
    _enrich_with_guessed_oeselftest_metadata(logger, target)

    # Test runs with LTP results in should only be compared with other runs with LTP tests in them
    if base_configuration.get('TEST_TYPE') == 'runtime' and any(result.startswith("ltpresult") for result in base['result']):
        ret = target_configuration.get('TEST_TYPE') == 'runtime' and any(result.startswith("ltpresult") for result in target['result'])

    return ret and metadata_matches(base_configuration, target_configuration) \
        and machine_matches(base_configuration, target_configuration)
184
def get_status_str(raw_status):
    """Return the display string for a raw test status.

    A missing/None status is translated through STATUS_STRINGS into the
    "No matching test result" message; any other status is looked up
    lowercased and falls back to being returned unchanged.
    """
    if not raw_status:
        return STATUS_STRINGS["None"]
    return STATUS_STRINGS.get(raw_status.lower(), raw_status)
Andrew Geissler6aa7eec2023-03-03 12:41:14 -0600188
def get_additional_info_line(new_pass_count, new_tests):
    """Build the one-line improvements summary (new tests and/or newly passing
    tests) appended to a match report; empty string when there is nothing to say."""
    notes = []
    if new_tests:
        notes.append(f'+{new_tests} test(s) present')
    if new_pass_count:
        notes.append(f'+{new_pass_count} test(s) now passing')

    if notes:
        return ' -> ' + ', '.join(notes) + '\n'
    return ""
200
def compare_result(logger, base_name, target_name, base_result, target_result, display_limit=None):
    """Compare a base and a target result set.

    Returns a (result, resultstring) tuple: result maps each test whose status
    changed to {'base': status, 'target': status} — it is None when the sets
    could not be compared or when only improvements were found — and
    resultstring is the human-readable report built from those changes.
    display_limit caps how many regression lines are printed per test family
    (0 means unlimited; may be a string, as it comes from the command line).
    """
    base_result = base_result.get('result')
    target_result = target_result.get('result')
    result = {}
    regressions = {}
    resultstring = ""
    new_tests = 0
    new_pass_count = 0

    display_limit = int(display_limit) if display_limit else REGRESSIONS_DISPLAY_LIMIT

    if base_result and target_result:
        # Collect every test whose status differs between base and target
        for k in base_result:
            base_status = base_result[k].get('status')
            if base_status:
                target_status = target_result.get(k, {}).get('status')
                if base_status != target_status:
                    result[k] = {'base': base_status, 'target': target_status}
            else:
                logger.error('Failed to retrieve base test case status: %s' % k)

        # Also count new tests that were not present in base results: it
        # could be newly added tests, but it could also highlights some tests
        # renames or fixed faulty ptests
        new_tests = sum(1 for k in target_result if k not in base_result)

        if result:
            new_pass_count = sum(test['target'] is not None and test['target'].startswith("PASS") for test in result.values())
            # Print a regression report only if at least one test has a regression status (FAIL, SKIPPED, absent...)
            if new_pass_count < len(result):
                resultstring = "Regression: %s\n %s\n" % (base_name, target_name)
                for k in sorted(result):
                    if not result[k]['target'] or not result[k]['target'].startswith("PASS"):
                        # Differentiate each ptest kind when listing regressions
                        key_parts = k.split('.')
                        key = '.'.join(key_parts[:2]) if k.startswith('ptest') else key_parts[0]
                        # Append new regression to corresponding test family
                        regressions.setdefault(key, []).append(' %s: %s -> %s\n' % (k, get_status_str(result[k]['base']), get_status_str(result[k]['target'])))
                resultstring += f" Total: {sum(len(v) for v in regressions.values())} new regression(s):\n"
                for k in regressions:
                    resultstring += f" {len(regressions[k])} regression(s) for {k}\n"
                    count_to_print = min(display_limit, len(regressions[k])) if display_limit > 0 else len(regressions[k])
                    resultstring += ''.join(regressions[k][:count_to_print])
                    if count_to_print < len(regressions[k]):
                        resultstring += ' [...]\n'
                if new_pass_count > 0:
                    resultstring += f' Additionally, {new_pass_count} previously failing test(s) is/are now passing\n'
                if new_tests > 0:
                    resultstring += f' Additionally, {new_tests} new test(s) is/are present\n'
            else:
                # Only improvements: report a plain match, not a regression
                resultstring = "%s\n%s\n" % (base_name, target_name)
                result = None
    else:
        resultstring = "%s\n%s\n" % (base_name, target_name)

    if not result:
        additional_info = get_additional_info_line(new_pass_count, new_tests)
        if additional_info:
            resultstring += additional_info

    return result, resultstring
266
def get_results(logger, source):
    """Load result data from *source* (file/directory/URL), keyed by the regression configuration map."""
    return resultutils.load_resultsdata(source, configmap=resultutils.regression_map)
269
def regression(args, logger):
    """Entry point for the 'regression' subcommand: load the base and target
    result sets named on the command line and run the common comparison."""
    base_results = get_results(logger, args.base_result)
    target_results = get_results(logger, args.target_result)

    # Propagate regression_common's exit code instead of implicitly returning
    # None, for consistency with regression_git's explicit return
    return regression_common(args, logger, base_results, target_results)
275
# Some test case naming is poor and contains random strings, particularly lttng/babeltrace.
# Truncating the test names works since they contain file and line number identifiers
# which allows us to match them without the random components.
def fixup_ptest_names(results, logger):
    """Normalize ptest case names in *results* in place.

    Strips the random/per-build suffixes from lttng-tools/babeltrace, curl,
    dbus, binutils and gcc ptest names so the same test can be matched across
    runs. *logger* is currently unused but kept for interface stability.
    """
    for r in results:
        for i in results[r]:
            tests = list(results[r][i]['result'].keys())
            for test in tests:
                new = None
                if test.startswith(("ptestresult.lttng-tools.", "ptestresult.babeltrace.", "ptestresult.babeltrace2")) and "_-_" in test:
                    new = test.split("_-_")[0]
                elif test.startswith(("ptestresult.curl.")) and "__" in test:
                    new = test.split("__")[0]
                elif test.startswith(("ptestresult.dbus.")) and "__" in test:
                    new = test.split("__")[0]
                elif test.startswith("ptestresult.binutils") and "build-st-" in test:
                    new = test.split(" ")[0]
                elif test.startswith("ptestresult.gcc") and "/tmp/runtest." in test:
                    new = ".".join(test.split(".")[:2])
                # Only rename when truncation produced a different name: when
                # new == test (e.g. a binutils name containing "build-st-" but
                # no space) the rename below would delete the entry outright
                if new and new != test:
                    results[r][i]['result'][new] = results[r][i]['result'][test]
                    del results[r][i]['result'][test]
298
def regression_common(args, logger, base_results, target_results):
    """Pair up base and target result sets and print the regression report.

    Optionally filters both sets by args.base_result_id / args.target_result_id
    and normalizes ptest names. For each top-level key present in both sets,
    comparable pairs with no status changes are recorded as matches and removed
    from further pairing; the remaining comparable pairs are reported as
    regressions; base keys absent from the target are reported as missing.
    Prints the three report sections and always returns 0.
    """
    if args.base_result_id:
        base_results = resultutils.filter_resultsdata(base_results, args.base_result_id)
    if args.target_result_id:
        target_results = resultutils.filter_resultsdata(target_results, args.target_result_id)

    fixup_ptest_names(base_results, logger)
    fixup_ptest_names(target_results, logger)

    matches = []
    regressions = []
    notfound = []

    for a in base_results:
        if a in target_results:
            base = list(base_results[a].keys())
            target = list(target_results[a].keys())
            # We may have multiple base/targets which are for different configurations. Start by
            # removing any pairs which match
            # (iterate over copies since matched entries are removed from base/target)
            for c in base.copy():
                for b in target.copy():
                    if not can_be_compared(logger, base_results[a][c], target_results[a][b]):
                        continue
                    res, resstr = compare_result(logger, c, b, base_results[a][c], target_results[a][b], args.limit)
                    if not res:
                        # No status changes: record the match and stop looking
                        # for a partner for this base entry
                        matches.append(resstr)
                        base.remove(c)
                        target.remove(b)
                        break
            # Should only now see regressions, we may not be able to match multiple pairs directly
            for c in base:
                for b in target:
                    if not can_be_compared(logger, base_results[a][c], target_results[a][b]):
                        continue
                    res, resstr = compare_result(logger, c, b, base_results[a][c], target_results[a][b], args.limit)
                    if res:
                        regressions.append(resstr)
        else:
            notfound.append("%s not found in target" % a)
    print("\n".join(sorted(regressions)))
    print("\n" + MISSING_TESTS_BANNER + "\n")
    print("\n".join(sorted(notfound)))
    print("\n" + ADDITIONAL_DATA_BANNER + "\n")
    print("\n".join(sorted(matches)))
    return 0
344
def regression_git(args, logger):
    """Entry point for the 'regression-git' subcommand.

    Picks two tagged test-result revisions from the git repository in
    args.repo (optionally across two branches / by commit or commit number),
    loads both result sets and runs the common regression comparison.
    Returns 0 on success, 1 when suitable revisions cannot be determined.
    """
    base_results = {}
    target_results = {}

    # Tag layout produced by gitarchive when results were stored
    tag_name = "{branch}/{commit_number}-g{commit}/{tag_number}"
    repo = GitRepo(args.repo)

    revs = gitarchive.get_test_revs(logger, repo, tag_name, branch=args.branch)

    if args.branch2:
        # Cross-branch comparison: the target revisions come from branch2
        revs2 = gitarchive.get_test_revs(logger, repo, tag_name, branch=args.branch2)
        if not len(revs2):
            logger.error("No revisions found to compare against")
            return 1
        if not len(revs):
            logger.error("No revision to report on found")
            return 1
    else:
        # Same-branch comparison needs at least two revisions
        if len(revs) < 2:
            logger.error("Only %d tester revisions found, unable to generate report" % len(revs))
            return 1

    # Pick revisions
    if args.commit:
        if args.commit_number:
            logger.warning("Ignoring --commit-number as --commit was specified")
        index1 = gitarchive.rev_find(revs, 'commit', args.commit)
    elif args.commit_number:
        index1 = gitarchive.rev_find(revs, 'commit_number', args.commit_number)
    else:
        # Default to the most recent revision on the report branch
        index1 = len(revs) - 1

    if args.branch2:
        # Carry the chosen base revision over into the branch2 list so both
        # indices address the same list from here on
        revs2.append(revs[index1])
        index1 = len(revs2) - 1
        revs = revs2

    if args.commit2:
        if args.commit_number2:
            logger.warning("Ignoring --commit-number2 as --commit2 was specified")
        index2 = gitarchive.rev_find(revs, 'commit', args.commit2)
    elif args.commit_number2:
        index2 = gitarchive.rev_find(revs, 'commit_number', args.commit_number2)
    else:
        if index1 > 0:
            index2 = index1 - 1
            # Find the closest matching commit number for comparison
            # In future we could check the commit is a common ancestor and
            # continue back if not but this good enough for now
            while index2 > 0 and revs[index2].commit_number > revs[index1].commit_number:
                index2 = index2 - 1
        else:
            logger.error("Unable to determine the other commit, use "
                    "--commit2 or --commit-number2 to specify it")
            return 1

    logger.info("Comparing:\n%s\nto\n%s\n" % (revs[index1], revs[index2]))

    base_results = resultutils.git_get_result(repo, revs[index1][2])
    target_results = resultutils.git_get_result(repo, revs[index2][2])

    regression_common(args, logger, base_results, target_results)

    return 0
409
def register_commands(subparsers):
    """Register subcommands from this plugin"""

    # Plain file/directory/URL comparison
    regression_parser = subparsers.add_parser('regression', help='regression file/directory analysis',
                                              description='regression analysis comparing the base set of results to the target results',
                                              group='analysis')
    regression_parser.set_defaults(func=regression)
    regression_parser.add_argument('base_result',
                                   help='base result file/directory/URL for the comparison')
    regression_parser.add_argument('target_result',
                                   help='target result file/directory/URL to compare with')
    regression_parser.add_argument('-b', '--base-result-id', default='',
                                   help='(optional) filter the base results to this result ID')
    regression_parser.add_argument('-t', '--target-result-id', default='',
                                   help='(optional) filter the target results to this result ID')

    # Comparison between result revisions stored in a git repository
    git_parser = subparsers.add_parser('regression-git', help='regression git analysis',
                                       description='regression analysis comparing base result set to target '
                                                   'result set',
                                       group='analysis')
    git_parser.set_defaults(func=regression_git)
    git_parser.add_argument('repo',
                            help='the git repository containing the data')
    git_parser.add_argument('-b', '--base-result-id', default='',
                            help='(optional) default select regression based on configurations unless base result '
                                 'id was provided')
    git_parser.add_argument('-t', '--target-result-id', default='',
                            help='(optional) default select regression based on configurations unless target result '
                                 'id was provided')

    git_parser.add_argument('--branch', '-B', default='master', help="Branch to find commit in")
    git_parser.add_argument('--branch2', help="Branch to find comparision revisions in")
    git_parser.add_argument('--commit', help="Revision to search for")
    git_parser.add_argument('--commit-number', help="Revision number to search for, redundant if --commit is specified")
    git_parser.add_argument('--commit2', help="Revision to compare with")
    git_parser.add_argument('--commit-number2', help="Revision number to compare with, redundant if --commit2 is specified")
    git_parser.add_argument('-l', '--limit', default=REGRESSIONS_DISPLAY_LIMIT, help="Maximum number of changes to display per test. Can be set to 0 to print all changes")
Brad Bishop40320b12019-03-26 16:08:25 -0400447