Brad Bishop | 316dfdd | 2018-06-25 12:45:53 -0400 | [diff] [blame] | 1 | # reproducible_build.bbclass |
| 2 | # |
Brad Bishop | 1a4b7ee | 2018-12-16 17:11:34 -0800 | [diff] [blame] | 3 | # Sets SOURCE_DATE_EPOCH in each component's build environment. |
| 4 | # Upstream components (generally) respect this environment variable, |
| 5 | # using it in place of the "current" date and time. |
| 6 | # See https://reproducible-builds.org/specs/source-date-epoch/ |
Brad Bishop | 316dfdd | 2018-06-25 12:45:53 -0400 | [diff] [blame] | 7 | # |
Brad Bishop | 1a4b7ee | 2018-12-16 17:11:34 -0800 | [diff] [blame] | 8 | # After sources are unpacked but before they are patched, we set a reproducible value for SOURCE_DATE_EPOCH. |
| 9 | # This value should be reproducible for anyone who builds the same revision from the same sources. |
Brad Bishop | 316dfdd | 2018-06-25 12:45:53 -0400 | [diff] [blame] | 10 | # |
Brad Bishop | 1a4b7ee | 2018-12-16 17:11:34 -0800 | [diff] [blame] | 11 | # There are 5 ways we determine SOURCE_DATE_EPOCH: |
Brad Bishop | 316dfdd | 2018-06-25 12:45:53 -0400 | [diff] [blame] | 12 | # |
Brad Bishop | 1a4b7ee | 2018-12-16 17:11:34 -0800 | [diff] [blame] | 13 | # 1. Use the value from __source_date_epoch.txt file if this file exists. |
| 14 | # This file was most likely created in the previous build by one of the following methods 2,3,4. |
| 15 | # Alternatively, it can be provided by a recipe via SRC_URI. |
Brad Bishop | 316dfdd | 2018-06-25 12:45:53 -0400 | [diff] [blame] | 16 | # |
Brad Bishop | 1a4b7ee | 2018-12-16 17:11:34 -0800 | [diff] [blame] | 17 | # If the file does not exist: |
| 18 | # |
| 19 | # 2. If there is a git checkout, use the last git commit timestamp. |
| 20 | # Git does not preserve file timestamps on checkout. |
Brad Bishop | 316dfdd | 2018-06-25 12:45:53 -0400 | [diff] [blame] | 21 | # |
| 22 | # 3. Use the mtime of "known" files such as NEWS, CHANGELOG, ... |
Brad Bishop | 1a4b7ee | 2018-12-16 17:11:34 -0800 | [diff] [blame] | 23 | # This works for well-kept repositories distributed via tarball. |
Brad Bishop | 316dfdd | 2018-06-25 12:45:53 -0400 | [diff] [blame] | 24 | # |
Brad Bishop | a5c52ff | 2018-11-23 10:55:50 +1300 | [diff] [blame] | 25 | # 4. Use the modification time of the youngest file in the source tree, if there is one. |
| 26 | # This will be the newest file from the distribution tarball, if any. |
| 27 | # |
| 28 | # 5. Fall back to a fixed timestamp. |
Brad Bishop | 316dfdd | 2018-06-25 12:45:53 -0400 | [diff] [blame] | 29 | # |
Brad Bishop | 1a4b7ee | 2018-12-16 17:11:34 -0800 | [diff] [blame] | 30 | # Once the value of SOURCE_DATE_EPOCH is determined, it is stored in the recipe's SDE_FILE. |
| 31 | # If none of these mechanisms are suitable, replace the do_deploy_source_date_epoch task |
| 32 | # with recipe-specific functionality to write the appropriate SOURCE_DATE_EPOCH into the SDE_FILE. |
| 33 | # |
| 34 | # If this file is found by other tasks, the value is exported in the SOURCE_DATE_EPOCH variable. |
| 35 | # SOURCE_DATE_EPOCH is set for all tasks that might use it (do_configure, do_compile, do_package, ...) |
Brad Bishop | 316dfdd | 2018-06-25 12:45:53 -0400 | [diff] [blame] | 36 | |
# Weak default: reproducible builds are on unless something else sets this.
# This must stay ahead of the inherit below, which reads it at parse time.
BUILD_REPRODUCIBLE_BINARIES ??= '1'
inherit ${@oe.utils.ifelse(d.getVar('BUILD_REPRODUCIBLE_BINARIES') == '1', 'reproducible_build_simple', '')}

# SDE_FILE is where the recipe's SOURCE_DATE_EPOCH value is written;
# SDE_DEPLOYDIR is the directory do_deploy_source_date_epoch copies it into.
SDE_DIR = "${WORKDIR}/source-date-epoch"
SDE_FILE = "${SDE_DIR}/__source_date_epoch.txt"
SDE_DEPLOYDIR = "${WORKDIR}/deploy-source-date-epoch"

SSTATETASKS += "do_deploy_source_date_epoch"
| 45 | |
# Copy the recipe's SOURCE_DATE_EPOCH file into SDE_DEPLOYDIR.
# A missing SDE_FILE is only reported; it does not fail the task.
do_deploy_source_date_epoch () {
    mkdir -p ${SDE_DEPLOYDIR}
    if [ ! -e ${SDE_FILE} ]; then
        echo "${SDE_FILE} not found!"
    else
        echo "Deploying SDE from ${SDE_FILE} -> ${SDE_DEPLOYDIR}."
        # -p keeps the mode and timestamps of the source file
        cp -p ${SDE_FILE} ${SDE_DEPLOYDIR}/__source_date_epoch.txt
    fi
}
| 55 | |
python do_deploy_source_date_epoch_setscene () {
    # Run the sstate setscene step first, then move the epoch file found in
    # SDE_DEPLOYDIR (if any) to SDE_FILE, where the other tasks read it.
    sstate_setscene(d)
    bb.utils.mkdirhier(d.getVar('SDE_DIR'))

    deployed = os.path.join(d.getVar('SDE_DEPLOYDIR'), '__source_date_epoch.txt')
    if not os.path.exists(deployed):
        bb.debug(1, "%s not found!" % deployed)
    else:
        destination = d.getVar('SDE_FILE')
        bb.debug(1, "Moving setscene SDE file %s -> %s" % (deployed, destination))
        os.rename(deployed, destination)
}
| 67 | |
# Task wiring for the deploy task: both varflags point at SDE_DEPLOYDIR, and
# the task is scheduled between do_patch and do_configure.
do_deploy_source_date_epoch[sstate-plaindirs] = "${SDE_DEPLOYDIR}"
do_deploy_source_date_epoch[dirs] = "${SDE_DEPLOYDIR}"
addtask do_deploy_source_date_epoch_setscene
addtask do_deploy_source_date_epoch after do_patch before do_configure
| 72 | |
def get_source_date_epoch_from_known_files(d, sourcedir):
    """Return the newest mtime among well-known changelog-style files.

    Looks directly inside ``sourcedir`` for NEWS, ChangeLog, Changelog and
    CHANGES. Returns the largest integer mtime found, or None when none of
    them exists as a regular file. ``d`` is not used by this helper.
    """
    best_mtime = None
    best_path = None
    for name in {"NEWS", "ChangeLog", "Changelog", "CHANGES"}:
        candidate = os.path.join(sourcedir, name)
        if not os.path.isfile(candidate):
            continue
        stamp = int(os.lstat(candidate).st_mtime)
        # More than one known file may be present; keep the youngest one.
        if best_mtime and stamp <= best_mtime:
            continue
        best_mtime = stamp
        best_path = candidate
    if best_path:
        bb.debug(1, "SOURCE_DATE_EPOCH taken from: %s" % best_path)
    return best_mtime
| 88 | |
def find_git_folder(d, sourcedir):
    """Locate the ``.git`` directory of the unpacked sources.

    Candidates are tried in this order:
      1. ``${WORKDIR}/git/.git`` (the default git fetcher unpack path)
      2. ``<sourcedir>/.git``
      3. the first ``.git`` directory found while walking WORKDIR, skipping
         well-known build output directories.

    Returns the path of the ``.git`` directory itself in every case, or None
    (after emitting a warning) when no repository is found.
    """
    # First guess: WORKDIR/git
    # This is the default git fetcher unpack path
    workdir = d.getVar('WORKDIR')
    gitpath = os.path.join(workdir, "git/.git")
    if os.path.isdir(gitpath):
        return gitpath

    # Second guess: ${S}
    gitpath = os.path.join(sourcedir, ".git")
    if os.path.isdir(gitpath):
        return gitpath

    # Perhaps there was a subpath or destsuffix specified.
    # Go looking in the WORKDIR
    exclude = {"build", "image", "license-destdir", "patches", "pseudo",
               "recipe-sysroot", "recipe-sysroot-native", "sysroot-destdir", "temp"}
    for root, dirs, files in os.walk(workdir, topdown=True):
        # Prune in place so os.walk does not descend into build output.
        dirs[:] = [name for name in dirs if name not in exclude]
        if '.git' in dirs:
            # Return the .git directory, consistent with the guesses above.
            return os.path.join(root, ".git")

    bb.warn("Failed to find a git repository in WORKDIR: %s" % workdir)
    return None
| 113 | |
def get_source_date_epoch_from_git(d, sourcedir):
    """Return the committer timestamp of the last git commit, or None.

    Only attempted when SRC_URI contains a ``git://`` or ``gitsm://`` entry
    and find_git_folder() locates a repository. The timestamp is taken from
    ``git log -1 --pretty=%ct`` run inside that repository.

    Returns None when SRC_URI is unset or has no git source, when no
    repository is found, or when git itself fails (for example a checkout
    without a valid HEAD), so the caller can fall back to another method.
    """
    import subprocess

    # SRC_URI may be unset; treat that the same as "no git source".
    src_uri = d.getVar('SRC_URI') or ""
    if "git://" not in src_uri and "gitsm://" not in src_uri:
        return None

    gitpath = find_git_folder(d, sourcedir)
    if not gitpath:
        return None

    bb.debug(1, "git repository: %s" % gitpath)
    try:
        output = subprocess.check_output(['git', 'log', '-1', '--pretty=%ct'], cwd=gitpath)
    except subprocess.CalledProcessError as exc:
        # Do not abort the task; let the caller try the next method.
        bb.warn("Unable to read the last commit time from %s: %s" % (gitpath, exc))
        return None
    return int(output)
| 123 | |
def get_source_date_epoch_from_youngest_file(d, sourcedir):
    """Return the mtime of the youngest non-hidden file under ``sourcedir``.

    Returns None when ``sourcedir`` is WORKDIR itself, or when the tree holds
    no file whose name does not start with a dot. Hidden files are ignored,
    but directories are not filtered.
    """
    if d.getVar('WORKDIR') == sourcedir:
        # These sources are almost certainly not from a tarball
        return None

    # Do it the hard way: check all files and find the youngest one...
    latest_mtime = None
    latest_path = None
    for dirpath, _subdirs, entries in os.walk(sourcedir, topdown=True):
        for entry in entries:
            if entry.startswith('.'):
                continue
            path = os.path.join(dirpath, entry)
            try:
                stamp = int(os.lstat(path).st_mtime)
            except ValueError:
                stamp = 0
            if latest_mtime and stamp <= latest_mtime:
                continue
            latest_mtime = stamp
            latest_path = path

    if latest_path:
        bb.debug(1, "Newest file found: %s" % latest_path)
    return latest_mtime
| 148 | |
def fixed_source_date_epoch():
    """Last-resort SOURCE_DATE_EPOCH: log the fallback and return 0."""
    fallback = 0
    bb.debug(1, "No tarball or git repo found to determine SOURCE_DATE_EPOCH")
    return fallback
| 152 | |
python create_source_date_epoch_stamp() {
    # Determine SOURCE_DATE_EPOCH for the sources in ${S} and write it to
    # SDE_FILE, replacing any value left there earlier.
    stamp_path = d.getVar('SDE_FILE')
    # If it exists we need to regenerate as the sources may have changed
    if os.path.isfile(stamp_path):
        bb.debug(1, "Deleting existing SOURCE_DATE_EPOCH from: %s" % stamp_path)
        os.remove(stamp_path)

    srcdir = d.getVar('S')
    # Try each method in turn; the first one that yields a non-zero value wins.
    epoch = get_source_date_epoch_from_git(d, srcdir)
    if not epoch:
        epoch = get_source_date_epoch_from_known_files(d, srcdir)
    if not epoch:
        epoch = get_source_date_epoch_from_youngest_file(d, srcdir)
    if not epoch:
        epoch = fixed_source_date_epoch()  # Last resort

    bb.debug(1, "SOURCE_DATE_EPOCH: %d" % epoch)
    bb.utils.mkdirhier(d.getVar('SDE_DIR'))
    with open(stamp_path, 'w') as out:
        out.write(str(epoch))
}
| 173 | |
def get_source_date_epoch_value(d):
    """Return SOURCE_DATE_EPOCH as a string, reading SDE_FILE at most once.

    A value already stored in ``__CACHED_SOURCE_DATE_EPOCH`` is returned
    unchanged. Otherwise SDE_FILE is read; a missing file or unparsable
    content yields 0. The result is stored in the datastore before returning.
    """
    memo = d.getVar('__CACHED_SOURCE_DATE_EPOCH')
    if memo:
        return memo

    path = d.getVar('SDE_FILE')
    epoch = 0
    if not os.path.isfile(path):
        bb.debug(1, "Cannot find %s. SOURCE_DATE_EPOCH will default to %d" % (path, epoch))
    else:
        with open(path, 'r') as handle:
            raw = handle.read()
        try:
            epoch = int(raw)
        except ValueError:
            bb.warn("SOURCE_DATE_EPOCH value '%s' is invalid. Reverting to 0" % raw)
            epoch = 0
        bb.debug(1, "SOURCE_DATE_EPOCH: %d" % epoch)

    result = str(epoch)
    d.setVar('__CACHED_SOURCE_DATE_EPOCH', result)
    return result
| 195 | |
# Exported so tasks see SOURCE_DATE_EPOCH in their environment; ?= leaves an
# already-set value untouched.
export SOURCE_DATE_EPOCH ?= "${@get_source_date_epoch_value(d)}"
# NOTE(review): presumably whitelisted so the per-recipe value does not feed
# into the base hash - confirm.
BB_HASHBASE_WHITELIST += "SOURCE_DATE_EPOCH"
| 198 | |
python () {
    # Only hook the stamp generator onto do_unpack for reproducible builds.
    reproducible = d.getVar('BUILD_REPRODUCIBLE_BINARIES')
    if reproducible == '1':
        d.appendVarFlag("do_unpack", "postfuncs", " create_source_date_epoch_stamp")
}