blob: 542bbb9d133f4c43e6ee1c2248165662a60a7f09 [file] [log] [blame]
Patrick Williamsc124f4f2015-09-15 14:41:29 -05001import hashlib
2import logging
3import os
4import re
5import tempfile
Patrick Williamsc0f7c042017-02-23 20:41:17 -06006import pickle
Patrick Williamsc124f4f2015-09-15 14:41:29 -05007import bb.data
Patrick Williamsd8c66bc2016-06-20 12:57:21 -05008from bb.checksum import FileChecksumCache
Patrick Williamsc124f4f2015-09-15 14:41:29 -05009
# Shared logger for the signature generation code in this module.
logger = logging.getLogger(
    'BitBake.SigGen'
)
11
def init(d):
    """Create the signature generator selected by ``BB_SIGNATURE_HANDLER``.

    Every class found in this module's globals that is ``SignatureGenerator``
    or a subclass of it is a candidate.  The first candidate whose ``name``
    attribute equals the configured handler name is instantiated with ``d``.

    Args:
        d: datastore object; only ``d.getVar(name, expand)`` is used here.

    Returns:
        An instance of the matching generator class.  If the variable is
        unset or empty the name "noop" is used.  If no candidate matches, an
        error listing the available names is logged and a plain
        ``SignatureGenerator`` is returned.
    """
    siggens = [obj for obj in globals().values()
               if type(obj) is type and issubclass(obj, SignatureGenerator)]

    desired = d.getVar("BB_SIGNATURE_HANDLER", True) or "noop"
    for sg in siggens:
        if desired == sg.name:
            return sg(d)

    # Only reached when no generator carries the requested name.
    logger.error("Invalid signature generator '%s', using default 'noop'\n"
                 "Available generators: %s", desired,
                 ', '.join(obj.name for obj in siggens))
    return SignatureGenerator(d)
26
class SignatureGenerator(object):
    """
    Signature generator registered under the name "noop".

    It keeps the bookkeeping dictionaries that get_taskdata()/set_taskdata()
    exchange, but never fills them itself: every task hash is the constant
    "0" and the dump/finalise hooks do nothing.
    """
    name = "noop"

    def __init__(self, data):
        # 'data' is accepted for interface compatibility; it is not read here.
        self.taints = {}
        self.file_checksum_values = {}
        self.runtaskdeps = {}
        self.taskhash = {}
        self.basehash = {}

    def finalise(self, fn, d, varient):
        """Hook with no effect in this generator."""
        return None

    def get_taskhash(self, fn, task, deps, dataCache):
        """Return the constant hash "0" regardless of the arguments."""
        return "0"

    def writeout_file_checksum_cache(self):
        """Write/update the file checksum cache onto disk"""
        return None

    def stampfile(self, stampbase, file_name, taskname, extrainfo):
        """Return "<stampbase>.<taskname>.<extrainfo>" without trailing dots."""
        stamp = "%s.%s.%s" % (stampbase, taskname, extrainfo)
        return stamp.rstrip('.')

    def stampcleanmask(self, stampbase, file_name, taskname, extrainfo):
        """Return the same string stampfile() builds for these arguments."""
        mask = "%s.%s.%s" % (stampbase, taskname, extrainfo)
        return mask.rstrip('.')

    def dump_sigtask(self, fn, task, stampbase, runtime):
        """Hook with no effect in this generator."""
        return None

    def invalidate_task(self, task, d, fn):
        """Invalidate the task by deleting its stamp via bb.build.del_stamp()."""
        bb.build.del_stamp(task, d, fn)

    def dump_sigs(self, dataCache, options):
        """Hook with no effect in this generator."""
        return None

    def get_taskdata(self):
        """Return the state as the 5-tuple that set_taskdata() accepts."""
        state = (
            self.runtaskdeps,
            self.taskhash,
            self.file_checksum_values,
            self.taints,
            self.basehash,
        )
        return state

    def set_taskdata(self, data):
        """Restore the state from a 5-tuple produced by get_taskdata()."""
        # Unpack first so a malformed tuple leaves the object untouched.
        runtaskdeps, taskhash, checksums, taints, basehash = data
        self.runtaskdeps = runtaskdeps
        self.taskhash = taskhash
        self.file_checksum_values = checksums
        self.taints = taints
        self.basehash = basehash
Patrick Williamsc124f4f2015-09-15 14:41:29 -050069
class SignatureGeneratorBasic(SignatureGenerator):
    """
    Signature generator registered under the name "basic".

    For every task it computes an md5 "base hash" over the task's own value
    and the values of all variables it (transitively) depends on, and a
    "task hash" that additionally folds in the task hashes of its runtime
    dependencies, file checksums and taints.  The inputs of both hashes can
    be written out as pickled signature files.
    """
    name = "basic"

    def __init__(self, data):
        """Initialise empty state and read the whitelist/cache settings.

        Args:
            data: datastore object; ``data.getVar(name, expand)`` is used to
                read BB_HASHBASE_WHITELIST, BB_HASHTASK_WHITELIST and
                BB_HASH_CHECKSUM_CACHE_FILE.
        """
        self.basehash = {}
        self.taskhash = {}
        self.taskdeps = {}
        self.runtaskdeps = {}
        self.file_checksum_values = {}
        self.taints = {}
        self.gendeps = {}
        self.lookupcache = {}
        # Raw string: "\." must reach the regex engine as an escaped dot.
        self.pkgnameextract = re.compile(r"(?P<fn>.*)\..*")
        self.basewhitelist = set((data.getVar("BB_HASHBASE_WHITELIST", True) or "").split())
        self.taskwhitelist = None
        self.init_rundepcheck(data)
        checksum_cache_file = data.getVar("BB_HASH_CHECKSUM_CACHE_FILE", True)
        if checksum_cache_file:
            self.checksum_cache = FileChecksumCache()
            self.checksum_cache.init_cache(data, checksum_cache_file)
        else:
            self.checksum_cache = None

    def init_rundepcheck(self, data):
        """Read BB_HASHTASK_WHITELIST and compile it into ``self.twl``.

        ``self.taskwhitelist`` keeps the raw regular expression string (or
        None); ``self.twl`` is the compiled pattern (or None).
        """
        self.taskwhitelist = data.getVar("BB_HASHTASK_WHITELIST", True) or None
        if self.taskwhitelist:
            self.twl = re.compile(self.taskwhitelist)
        else:
            self.twl = None

    def _build_data(self, fn, d):
        """Compute and record the base hash of every task of recipe ``fn``.

        Returns:
            dict mapping each task name to the sorted list of variables it
            transitively depends on (whitelisted variables excluded).
        """
        tasklist, gendeps, lookupcache = bb.data.generate_dependencies(d)

        taskdeps = {}

        for task in tasklist:
            data = lookupcache[task]

            if data is None:
                bb.error("Task %s from %s seems to be empty?!" % (task, fn))
                data = ''

            # Expand the direct dependencies into their transitive closure,
            # dropping whitelisted variables at every level.
            gendeps[task] -= self.basewhitelist
            newdeps = gendeps[task]
            seen = set()
            while newdeps:
                nextdeps = newdeps
                seen |= nextdeps
                newdeps = set()
                for dep in nextdeps:
                    if dep in self.basewhitelist:
                        continue
                    gendeps[dep] -= self.basewhitelist
                    newdeps |= gendeps[dep]
                newdeps -= seen

            # The hash input is the task value followed by "name + value"
            # of each dependency in sorted order (calc_basehash mirrors this).
            alldeps = sorted(seen)
            for dep in alldeps:
                data = data + dep
                var = lookupcache[dep]
                if var is not None:
                    data = data + str(var)
            datahash = hashlib.md5(data.encode("utf-8")).hexdigest()
            k = fn + "." + task
            if k in self.basehash and self.basehash[k] != datahash:
                bb.error("When reparsing %s, the basehash value changed from %s to %s. The metadata is not deterministic and this needs to be fixed." % (k, self.basehash[k], datahash))
            self.basehash[k] = datahash
            taskdeps[task] = alldeps

        self.taskdeps[fn] = taskdeps
        self.gendeps[fn] = gendeps
        self.lookupcache[fn] = lookupcache

        return taskdeps

    def finalise(self, fn, d, variant):
        """Compute the base hashes for ``fn`` and store them in ``d``.

        Each task's hash is written to the variable
        ``BB_BASEHASH_task-<task>``.  Any exception from the computation is
        re-raised after a warning naming the file has been emitted.
        """
        mc = d.getVar("__BBMULTICONFIG", False) or ""
        if variant or mc:
            fn = bb.cache.realfn2virtual(fn, variant, mc)

        try:
            taskdeps = self._build_data(fn, d)
        except:
            # Deliberately bare: the exception is re-raised untouched, the
            # warning only adds the file name for context.
            bb.warn("Error during finalise of %s" % fn)
            raise

        #Slow but can be useful for debugging mismatched basehashes
        #for task in self.taskdeps[fn]:
        #    self.dump_sigtask(fn, task, d.getVar("STAMP", True), False)

        for task in taskdeps:
            d.setVar("BB_BASEHASH_task-%s" % task, self.basehash[fn + "." + task])

    def rundep_check(self, fn, recipename, task, dep, depname, dataCache):
        """Decide whether a runtime dependency contributes to the task hash.

        Returns:
            False only when a task whitelist is configured, ``recipename``
            does not match it and ``depname`` does; True otherwise.
        """
        # Return True if we should keep the dependency, False to drop it
        # We only manipulate the dependencies for packages not in the whitelist
        if self.twl and not self.twl.search(recipename):
            # then process the actual dependencies
            if self.twl.search(depname):
                return False
        return True

    def read_taint(self, fn, task, stampbase):
        """Return the contents of ``<stampbase>.<task>.taint``.

        Returns None when the file cannot be opened or read (IOError).
        """
        taint = None
        try:
            with open(stampbase + '.' + task + '.taint', 'r') as taintf:
                taint = taintf.read()
        except IOError:
            pass
        return taint

    def get_taskhash(self, fn, task, deps, dataCache):
        """Compute, record and return the task hash of ``fn``.``task``.

        The hash input is the cached base hash, then the task hash of every
        kept dependency (ordered by clean_basepath), then every non-empty
        file checksum, then any taint.  ``self.runtaskdeps``,
        ``self.file_checksum_values``, ``self.taints`` and ``self.taskhash``
        are updated for the task as a side effect.

        Args:
            fn: recipe file name used as key prefix.
            task: task name.
            deps: iterable of dependency keys; each must already have an
                entry in ``self.taskhash``.
            dataCache: cache object providing ``basetaskhash``, ``pkg_fn``,
                ``file_checksums``, ``task_deps`` and ``stamp``.

        Returns:
            The md5 hex digest of the assembled data.
        """
        k = fn + "." + task
        data = dataCache.basetaskhash[k]
        self.basehash[k] = data
        self.runtaskdeps[k] = []
        self.file_checksum_values[k] = []
        recipename = dataCache.pkg_fn[fn]

        for dep in sorted(deps, key=clean_basepath):
            depname = dataCache.pkg_fn[self.pkgnameextract.search(dep).group('fn')]
            if not self.rundep_check(fn, recipename, task, dep, depname, dataCache):
                continue
            if dep not in self.taskhash:
                # Format eagerly, as every other bb.* call in this file does,
                # so the message never shows a literal "%s".
                bb.fatal("%s is not in taskhash, caller isn't calling in dependency order?" % dep)
            data = data + self.taskhash[dep]
            self.runtaskdeps[k].append(dep)

        if task in dataCache.file_checksums[fn]:
            if self.checksum_cache:
                checksums = self.checksum_cache.get_checksums(dataCache.file_checksums[fn][task], recipename)
            else:
                checksums = bb.fetch2.get_file_checksums(dataCache.file_checksums[fn][task], recipename)
            for (f, cs) in checksums:
                self.file_checksum_values[k].append((f, cs))
                if cs:
                    data = data + cs

        taskdep = dataCache.task_deps[fn]
        if 'nostamp' in taskdep and task in taskdep['nostamp']:
            # Nostamp tasks need an implicit taint so that they force any dependent tasks to run
            import uuid
            taint = str(uuid.uuid4())
            data = data + taint
            self.taints[k] = "nostamp:" + taint

        taint = self.read_taint(fn, task, dataCache.stamp[fn])
        if taint:
            data = data + taint
            self.taints[k] = taint
            logger.warning("%s is tainted from a forced run", k)

        h = hashlib.md5(data.encode("utf-8")).hexdigest()
        self.taskhash[k] = h
        #d.setVar("BB_TASKHASH_task-%s" % task, taskhash[task])
        return h

    def writeout_file_checksum_cache(self):
        """Write/update the file checksum cache onto disk"""
        if self.checksum_cache:
            self.checksum_cache.save_extras()
            self.checksum_cache.save_merge()
        else:
            bb.fetch2.fetcher_parse_save()
            bb.fetch2.fetcher_parse_done()

    def dump_sigtask(self, fn, task, stampbase, runtime):
        """Pickle the hash inputs of ``fn``.``task`` into a signature file.

        Args:
            fn: recipe file name used as key prefix.
            task: task name.
            stampbase: stamp path prefix, or the exact output path when
                ``runtime`` is a "customfile..." string.
            runtime: a true value selects a ".sigdata.<taskhash>" file (when
                the task hash is known), a false value a
                ".sigbasedata.<basehash>" file.  A string starting with
                "customfile" writes to ``stampbase`` itself and uses the
                text after the first 11 characters as the stamp from which
                the taint file is read.

        Raises:
            Whatever writing the file raises; the temporary file is removed
            before the exception propagates.
        """
        k = fn + "." + task
        referencestamp = stampbase
        if isinstance(runtime, str) and runtime.startswith("customfile"):
            sigfile = stampbase
            # Skip the 11-character "customfile:" prefix.
            referencestamp = runtime[11:]
        elif runtime and k in self.taskhash:
            sigfile = stampbase + "." + task + ".sigdata" + "." + self.taskhash[k]
        else:
            sigfile = stampbase + "." + task + ".sigbasedata" + "." + self.basehash[k]

        bb.utils.mkdirhier(os.path.dirname(sigfile))

        data = {}
        data['task'] = task
        data['basewhitelist'] = self.basewhitelist
        data['taskwhitelist'] = self.taskwhitelist
        data['taskdeps'] = self.taskdeps[fn][task]
        data['basehash'] = self.basehash[k]
        data['gendeps'] = {}
        data['varvals'] = {}
        data['varvals'][task] = self.lookupcache[fn][task]
        for dep in self.taskdeps[fn][task]:
            if dep in self.basewhitelist:
                continue
            data['gendeps'][dep] = self.gendeps[fn][dep]
            data['varvals'][dep] = self.lookupcache[fn][dep]

        if runtime and k in self.taskhash:
            data['runtaskdeps'] = self.runtaskdeps[k]
            data['file_checksum_values'] = [(os.path.basename(f), cs) for f, cs in self.file_checksum_values[k]]
            data['runtaskhashes'] = {}
            for dep in data['runtaskdeps']:
                data['runtaskhashes'][dep] = self.taskhash[dep]
            data['taskhash'] = self.taskhash[k]

        taint = self.read_taint(fn, task, referencestamp)
        if taint:
            data['taint'] = taint

        if runtime and k in self.taints:
            if 'nostamp:' in self.taints[k]:
                data['taint'] = self.taints[k]

        # Cross-check: recomputing the hashes from the data about to be
        # written must give the hashes recorded earlier.
        computed_basehash = calc_basehash(data)
        if computed_basehash != self.basehash[k]:
            bb.error("Basehash mismatch %s versus %s for %s" % (computed_basehash, self.basehash[k], k))
        if runtime and k in self.taskhash:
            computed_taskhash = calc_taskhash(data)
            if computed_taskhash != self.taskhash[k]:
                bb.error("Taskhash mismatch %s versus %s for %s" % (computed_taskhash, self.taskhash[k], k))
                sigfile = sigfile.replace(self.taskhash[k], computed_taskhash)

        # Write to a temp file in the target directory and rename it into
        # place so readers never see a partially written signature file.
        fd, tmpfile = tempfile.mkstemp(dir=os.path.dirname(sigfile), prefix="sigtask.")
        try:
            with os.fdopen(fd, "wb") as stream:
                pickle.dump(data, stream, -1)
                stream.flush()
            os.chmod(tmpfile, 0o664)
            os.rename(tmpfile, sigfile)
        except Exception:
            # Also covers pickling errors, which previously left the
            # temporary file behind.
            try:
                os.unlink(tmpfile)
            except OSError:
                pass
            raise

    def dump_sigs(self, dataCaches, options):
        """Write a runtime signature file for every task with a task hash.

        Args:
            dataCaches: mapping from multiconfig name to a cache object
                providing ``basetaskhash`` and ``stamp``.
            options: unused here.
        """
        for fn in self.taskdeps:
            for task in self.taskdeps[fn]:
                tid = fn + ":" + task
                (mc, _, _) = bb.runqueue.split_tid(tid)
                k = fn + "." + task
                if k not in self.taskhash:
                    continue
                if dataCaches[mc].basetaskhash[k] != self.basehash[k]:
                    bb.error("Bitbake's cached basehash does not match the one we just generated (%s)!" % k)
                    bb.error("The mismatched hashes were %s and %s" % (dataCaches[mc].basetaskhash[k], self.basehash[k]))
                self.dump_sigtask(fn, task, dataCaches[mc].stamp[fn], True)
Patrick Williamsc124f4f2015-09-15 14:41:29 -0500321
class SignatureGeneratorBasicHash(SignatureGeneratorBasic):
    """
    Signature generator registered under the name "basichash".

    Stamp file names carry the task hash (or the base hash when no task
    hash has been recorded), and invalidating a task writes a taint
    instead of deleting the stamp.
    """
    name = "basichash"

    def stampfile(self, stampbase, fn, taskname, extrainfo, clean=False):
        """Return "<stampbase>.<taskname>.<hash>.<extrainfo>" without trailing dots.

        With ``clean`` set, the hash component is the wildcard "*".
        """
        # "<task>_setscene" shares the hash of "<task>"; the task literally
        # named "do_setscene" is looked up under its own name.
        is_setscene_variant = taskname.endswith("_setscene") and taskname != "do_setscene"
        lookup_task = taskname[:-9] if is_setscene_variant else taskname
        key = fn + "." + lookup_task

        if clean:
            hashpart = "*"
        elif key in self.taskhash:
            hashpart = self.taskhash[key]
        else:
            # If key is not in basehash, then error
            hashpart = self.basehash[key]

        stamp = "%s.%s.%s.%s" % (stampbase, taskname, hashpart, extrainfo)
        return stamp.rstrip('.')

    def stampcleanmask(self, stampbase, fn, taskname, extrainfo):
        """Return the stamp name with "*" in place of the hash."""
        return self.stampfile(stampbase, fn, taskname, extrainfo, clean=True)

    def invalidate_task(self, task, d, fn):
        """Force a rebuild of the task by writing a taint for it."""
        message = "Tainting hash to force rebuild of task %s, %s" % (fn, task)
        bb.note(message)
        bb.build.write_taint(task, d, fn)
345
def dump_this_task(outfile, d):
    """Write the signature data of the currently executing task to ``outfile``.

    The recipe file name and the task name ("do_" + BB_CURRENTTASK) are read
    from ``d``; the task's stamp is passed along as the reference stamp of
    a "customfile:" dump.
    """
    import bb.parse
    recipe_file = d.getVar("BB_FILENAME", True)
    current_task = "do_" + d.getVar("BB_CURRENTTASK", True)
    stamp = bb.build.stamp_internal(current_task, d, None, True)
    runtime_spec = "customfile:" + stamp
    bb.parse.siggen.dump_sigtask(recipe_file, current_task, outfile, runtime_spec)
Patrick Williamsc124f4f2015-09-15 14:41:29 -0500352
def clean_basepath(a):
    """Shorten a task path to its last two path components plus qualifiers.

    The result is the second-to-last and last "/"-separated components
    concatenated directly.  For a path starting with "virtual:", ":" and the
    text before the last ":" is appended; for one starting with
    "multiconfig:<mc>:", ":multiconfig:<mc>" is appended when <mc> is
    non-empty.
    """
    multiconfig = None
    if a.startswith("multiconfig:"):
        _, multiconfig, a = a.split(":", 2)

    pieces = a.rsplit("/", 2)
    cleaned = pieces[1] + pieces[2]

    if a.startswith("virtual:"):
        virtual_prefix = a.rsplit(":", 1)[0]
        cleaned = cleaned + ":" + virtual_prefix
    if multiconfig:
        cleaned = cleaned + ":multiconfig:" + multiconfig
    return cleaned
363
def clean_basepaths(a):
    """Return a copy of mapping ``a`` with every key run through clean_basepath()."""
    return {clean_basepath(path): a[path] for path in a}
369
def clean_basepaths_list(a):
    """Return a list with clean_basepath() applied to every item of ``a``."""
    return [clean_basepath(path) for path in a]
375
def compare_sigfiles(a, b, recursecb = None):
    """Describe the differences between two pickled signature files.

    Args:
        a: path of the first ("old") signature file.
        b: path of the second ("new") signature file.
        recursecb: optional callable ``recursecb(dep, old_hash, new_hash)``
            invoked for every dependent task whose hash changed.  When it
            returns a non-empty list, the report collected so far is
            replaced by the line announcing that change followed by the
            returned list.

    Returns:
        A list of human-readable strings; empty when nothing differs.
    """
    output = []

    # NOTE(review): unpickling can execute code embedded in the file; only
    # feed this signature files from a trusted build tree.
    with open(a, 'rb') as f:
        a_data = pickle.Unpickler(f).load()
    with open(b, 'rb') as f:
        b_data = pickle.Unpickler(f).load()

    def dict_diff(old, new, whitelist=frozenset()):
        """Return the (changed, added, removed) key sets between two dicts."""
        old_keys = set(old.keys())
        new_keys = set(new.keys())
        changed = set(key for key in old_keys & new_keys
                      if old[key] != new[key] and key not in whitelist)
        return changed, new_keys - old_keys, old_keys - new_keys

    def file_checksums_diff(old, new):
        """Return (changed, added, removed) for two (filename, checksum) lists."""
        from collections import Counter
        # Handle old siginfo format
        if isinstance(old, dict):
            old = [(os.path.basename(f), cs) for f, cs in old.items()]
        if isinstance(new, dict):
            new = [(os.path.basename(f), cs) for f, cs in new.items()]
        # Compare lists, ensuring we can handle duplicate filenames if they exist
        removedcount = Counter(old)
        removedcount.subtract(new)
        addedcount = Counter(new)
        addedcount.subtract(old)
        added = []
        for x in new:
            if addedcount[x] > 0:
                addedcount[x] -= 1
                added.append(x)
        removed = []
        changed = []
        for x in old:
            if removedcount[x] > 0:
                removedcount[x] -= 1
                # A removed and an added entry with the same file name are
                # reported as one changed checksum.
                for y in added:
                    if y[0] == x[0]:
                        changed.append((x[0], x[1], y[1]))
                        added.remove(y)
                        break
                else:
                    removed.append(x)
        added = [x[0] for x in added]
        removed = [x[0] for x in removed]
        return changed, added, removed

    def whitelist_diff(key):
        """Report a change of the whitelist stored under ``key``."""
        old = a_data[key]
        new = b_data[key]
        if old == new:
            return
        output.append("%s changed from '%s' to '%s'" % (key, old, new))
        # The task whitelist is stored as a regular expression string, which
        # has no symmetric_difference(); only sets get an item-level diff.
        set_types = (set, frozenset)
        if old and new and isinstance(old, set_types) and isinstance(new, set_types):
            output.append("changed items: %s" % old.symmetric_difference(new))

    if 'basewhitelist' in a_data:
        whitelist_diff('basewhitelist')

    if 'taskwhitelist' in a_data:
        whitelist_diff('taskwhitelist')

    if a_data['taskdeps'] != b_data['taskdeps']:
        output.append("Task dependencies changed from:\n%s\nto:\n%s" % (sorted(a_data['taskdeps']), sorted(b_data['taskdeps'])))

    if a_data['basehash'] != b_data['basehash']:
        output.append("basehash changed from %s to %s" % (a_data['basehash'], b_data['basehash']))

    # Sets are iterated in sorted order below so the report is reproducible.
    changed, added, removed = dict_diff(a_data['gendeps'], b_data['gendeps'], a_data['basewhitelist'] & b_data['basewhitelist'])
    for dep in sorted(changed):
        old_deps = a_data['gendeps'][dep]
        new_deps = b_data['gendeps'][dep]
        output.append("List of dependencies for variable %s changed from '%s' to '%s'" % (dep, old_deps, new_deps))
        if old_deps and new_deps:
            output.append("changed items: %s" % old_deps.symmetric_difference(new_deps))
    for dep in sorted(added):
        output.append("Dependency on variable %s was added" % (dep))
    for dep in sorted(removed):
        output.append("Dependency on Variable %s was removed" % (dep))

    changed, added, removed = dict_diff(a_data['varvals'], b_data['varvals'])
    for dep in sorted(changed):
        output.append("Variable %s value changed from '%s' to '%s'" % (dep, a_data['varvals'][dep], b_data['varvals'][dep]))

    # Files written without runtime data lack these keys.
    a_data.setdefault('file_checksum_values', [])
    b_data.setdefault('file_checksum_values', [])

    changed, added, removed = file_checksums_diff(a_data['file_checksum_values'], b_data['file_checksum_values'])
    for fname, old, new in changed:
        output.append("Checksum for file %s changed from %s to %s" % (fname, old, new))
    for fname in added:
        output.append("Dependency on checksum of file %s was added" % (fname))
    for fname in removed:
        output.append("Dependency on checksum of file %s was removed" % (fname))

    a_data.setdefault('runtaskdeps', [])
    b_data.setdefault('runtaskdeps', [])

    if len(a_data['runtaskdeps']) != len(b_data['runtaskdeps']):
        changed = ["Number of task dependencies changed"]
    else:
        changed = []
        # Same length: compare the dependencies position by position.
        for a_dep, b_dep in zip(a_data['runtaskdeps'], b_data['runtaskdeps']):
            a_hash = a_data['runtaskhashes'][a_dep]
            b_hash = b_data['runtaskhashes'][b_dep]
            if a_hash != b_hash:
                changed.append("%s with hash %s\n changed to\n%s with hash %s" % (a_dep, a_hash, b_dep, b_hash))

    if changed:
        output.append("runtaskdeps changed from %s to %s" % (clean_basepaths_list(a_data['runtaskdeps']), clean_basepaths_list(b_data['runtaskdeps'])))
        output.append("\n".join(changed))

    if 'runtaskhashes' in a_data and 'runtaskhashes' in b_data:
        a_hashes = a_data['runtaskhashes']
        b_hashes = b_data['runtaskhashes']
        changed, added, removed = dict_diff(a_hashes, b_hashes)
        # A dependency that was merely replaced by another one with the same
        # hash is reported neither as added nor as removed.
        removed_hashes = set(a_hashes[dep] for dep in removed)
        added_hashes = set(b_hashes[dep] for dep in added)
        for dep in sorted(added):
            if b_hashes[dep] not in removed_hashes:
                output.append("Dependency on task %s was added with hash %s" % (clean_basepath(dep), b_hashes[dep]))
        for dep in sorted(removed):
            if a_hashes[dep] not in added_hashes:
                output.append("Dependency on task %s was removed with hash %s" % (clean_basepath(dep), a_hashes[dep]))
        for dep in sorted(changed):
            output.append("Hash for dependent task %s changed from %s to %s" % (clean_basepath(dep), a_hashes[dep], b_hashes[dep]))
            if callable(recursecb):
                # If a dependent hash changed, might as well print the line above and then defer to the changes in
                # that hash since in all likelihood, they're the same changes this task also saw.
                recout = recursecb(dep, a_hashes[dep], b_hashes[dep])
                if recout:
                    output = [output[-1]] + recout

    a_taint = a_data.get('taint', None)
    b_taint = b_data.get('taint', None)
    if a_taint != b_taint:
        output.append("Taint (by forced/invalidated task) changed from %s to %s" % (a_taint, b_taint))

    return output
542
543
def calc_basehash(sigdata):
    """Recompute a task's base hash from signature data.

    The hashed text is the value of the task itself (empty if None)
    followed, for each entry of ``sigdata['taskdeps']`` in order, by the
    dependency name and, unless it is None, its stringified value.

    Returns:
        The md5 hex digest of that text encoded as UTF-8.
    """
    task_name = sigdata['task']
    task_value = sigdata['varvals'][task_name]

    pieces = ['' if task_value is None else task_value]
    for dep in sigdata['taskdeps']:
        pieces.append(dep)
        dep_value = sigdata['varvals'][dep]
        if dep_value is not None:
            pieces.append(str(dep_value))

    text = "".join(pieces)
    return hashlib.md5(text.encode("utf-8")).hexdigest()
Patrick Williamsd8c66bc2016-06-20 12:57:21 -0500559
def calc_taskhash(sigdata):
    """Recompute a task hash from signature data.

    The hashed text is the base hash, then the hash of every entry of
    ``sigdata['runtaskdeps']`` in order, then every non-empty file checksum,
    then the taint if one is present.  For a taint containing "nostamp:"
    the first 8 characters are skipped.

    Returns:
        The md5 hex digest of that text encoded as UTF-8.
    """
    text = sigdata['basehash']

    for dep in sigdata['runtaskdeps']:
        text += sigdata['runtaskhashes'][dep]

    for entry in sigdata['file_checksum_values']:
        checksum = entry[1]
        if checksum:
            text += checksum

    if 'taint' in sigdata:
        taint = sigdata['taint']
        # 8 == len("nostamp:"); only the text after the marker is hashed.
        text += taint[8:] if 'nostamp:' in taint else taint

    return hashlib.md5(text.encode("utf-8")).hexdigest()
Patrick Williamsd8c66bc2016-06-20 12:57:21 -0500577
578
def dump_sigfile(a):
    """Return a human-readable listing of one pickled signature file.

    Args:
        a: path of the signature file.

    Returns:
        A list of strings describing the whitelists, dependencies, variable
        values, hashes and taint stored in the file, followed by the
        recomputed base hash and task hash where the file holds the data
        needed to compute them.
    """
    output = []

    # NOTE(review): unpickling can execute code embedded in the file; only
    # feed this signature files from a trusted build tree.
    with open(a, 'rb') as f:
        a_data = pickle.Unpickler(f).load()

    output.append("basewhitelist: %s" % (a_data['basewhitelist'],))

    output.append("taskwhitelist: %s" % (a_data['taskwhitelist'],))

    output.append("Task dependencies: %s" % (sorted(a_data['taskdeps']),))

    output.append("basehash: %s" % (a_data['basehash'],))

    for dep in a_data['gendeps']:
        output.append("List of dependencies for variable %s is %s" % (dep, a_data['gendeps'][dep]))

    for dep in a_data['varvals']:
        output.append("Variable %s value is %s" % (dep, a_data['varvals'][dep]))

    if 'runtaskdeps' in a_data:
        output.append("Tasks this task depends on: %s" % (a_data['runtaskdeps'],))

    if 'file_checksum_values' in a_data:
        output.append("This task depends on the checksums of files: %s" % (a_data['file_checksum_values'],))

    if 'runtaskhashes' in a_data:
        for dep in a_data['runtaskhashes']:
            output.append("Hash for dependent task %s is %s" % (dep, a_data['runtaskhashes'][dep]))

    if 'taint' in a_data:
        output.append("Tainted (by forced/invalidated task): %s" % (a_data['taint'],))

    if 'task' in a_data:
        computed_basehash = calc_basehash(a_data)
        output.append("Computed base hash is %s and from file %s" % (computed_basehash, a_data['basehash']))
    else:
        output.append("Unable to compute base hash")

    # Files written without runtime data lack the inputs of the task hash;
    # report that instead of failing with a KeyError.
    taskhash_inputs = ('runtaskdeps', 'runtaskhashes', 'file_checksum_values')
    if all(key in a_data for key in taskhash_inputs):
        computed_taskhash = calc_taskhash(a_data)
        output.append("Computed task hash is %s" % computed_taskhash)
    else:
        output.append("Unable to compute task hash")

    return output