blob: 23f8c0da8f442341d8bd582b9ee3a60e66a3d083 [file] [log] [blame]
Patrick Williamsc124f4f2015-09-15 14:41:29 -05001"""
2BitBake 'Fetch' git implementation
3
4git fetcher support the SRC_URI with format of:
5SRC_URI = "git://some.host/somepath;OptionA=xxx;OptionB=xxx;..."
6
7Supported SRC_URI options are:
8
9- branch
10 The git branch to retrieve from. The default is "master"
11
12 This option also supports multiple branch fetching, with branches
13 separated by commas. In multiple branches case, the name option
14 must have the same number of names to match the branches, which is
15 used to specify the SRC_REV for the branch
16 e.g:
17 SRC_URI="git://some.host/somepath;branch=branchX,branchY;name=nameX,nameY"
18 SRCREV_nameX = "xxxxxxxxxxxxxxxxxxxx"
19 SRCREV_nameY = "YYYYYYYYYYYYYYYYYYYY"
20
21- tag
22 The git tag to retrieve. The default is "master"
23
24- protocol
25 The method to use to access the repository. Common options are "git",
26 "http", "https", "file", "ssh" and "rsync". The default is "git".
27
28- rebaseable
29 rebaseable indicates that the upstream git repo may rebase in the future,
30 and current revision may disappear from upstream repo. This option will
31 remind fetcher to preserve local cache carefully for future use.
32 The default value is "0", set rebaseable=1 for rebaseable git repo.
33
34- nocheckout
35 Don't checkout source code when unpacking. set this option for the recipe
36 who has its own routine to checkout code.
37 The default is "0", set nocheckout=1 if needed.
38
39- bareclone
40 Create a bare clone of the source code and don't checkout the source code
41 when unpacking. Set this option for the recipe who has its own routine to
42 checkout code and tracking branch requirements.
43 The default is "0", set bareclone=1 if needed.
44
45- nobranch
46 Don't check the SHA validation for branch. set this option for the recipe
47 referring to commit which is valid in tag instead of branch.
48 The default is "0", set nobranch=1 if needed.
49
Patrick Williamsc0f7c042017-02-23 20:41:17 -060050- usehead
Brad Bishop6e60e8b2018-02-01 10:27:11 -050051 For local git:// urls to use the current branch HEAD as the revision for use with
Patrick Williamsc0f7c042017-02-23 20:41:17 -060052 AUTOREV. Implies nobranch.
53
Patrick Williamsc124f4f2015-09-15 14:41:29 -050054"""
55
Brad Bishopc342db32019-05-15 21:57:59 -040056# Copyright (C) 2005 Richard Purdie
Patrick Williamsc124f4f2015-09-15 14:41:29 -050057#
Brad Bishopc342db32019-05-15 21:57:59 -040058# SPDX-License-Identifier: GPL-2.0-only
Patrick Williamsc124f4f2015-09-15 14:41:29 -050059#
Patrick Williamsc124f4f2015-09-15 14:41:29 -050060
Brad Bishopd7bf8c12018-02-25 22:55:05 -050061import collections
Patrick Williamsd7e96312015-09-22 08:09:05 -050062import errno
Brad Bishopd7bf8c12018-02-25 22:55:05 -050063import fnmatch
Patrick Williamsc124f4f2015-09-15 14:41:29 -050064import os
65import re
Andrew Geissler4c19ea12020-10-27 13:52:24 -050066import shlex
Brad Bishopd7bf8c12018-02-25 22:55:05 -050067import subprocess
68import tempfile
Patrick Williamsc124f4f2015-09-15 14:41:29 -050069import bb
Patrick Williamsc0f7c042017-02-23 20:41:17 -060070import bb.progress
Andrew Geissler5199d832021-09-24 16:47:35 -050071from contextlib import contextmanager
Patrick Williamsc124f4f2015-09-15 14:41:29 -050072from bb.fetch2 import FetchMethod
73from bb.fetch2 import runfetchcmd
74from bb.fetch2 import logger
75
Patrick Williamsc0f7c042017-02-23 20:41:17 -060076
Patrick Williams03907ee2022-05-01 06:28:52 -050077sha1_re = re.compile(r'^[0-9a-f]{40}$')
78slash_re = re.compile(r"/+")
79
Patrick Williamsc0f7c042017-02-23 20:41:17 -060080class GitProgressHandler(bb.progress.LineFilterProgressHandler):
81 """Extract progress information from git output"""
82 def __init__(self, d):
83 self._buffer = ''
84 self._count = 0
85 super(GitProgressHandler, self).__init__(d)
86 # Send an initial progress event so the bar gets shown
87 self._fire_progress(-1)
88
89 def write(self, string):
90 self._buffer += string
91 stages = ['Counting objects', 'Compressing objects', 'Receiving objects', 'Resolving deltas']
92 stage_weights = [0.2, 0.05, 0.5, 0.25]
93 stagenum = 0
94 for i, stage in reversed(list(enumerate(stages))):
95 if stage in self._buffer:
96 stagenum = i
97 self._buffer = ''
98 break
99 self._status = stages[stagenum]
100 percs = re.findall(r'(\d+)%', string)
101 if percs:
102 progress = int(round((int(percs[-1]) * stage_weights[stagenum]) + (sum(stage_weights[:stagenum]) * 100)))
103 rates = re.findall(r'([\d.]+ [a-zA-Z]*/s+)', string)
104 if rates:
105 rate = rates[-1]
106 else:
107 rate = None
108 self.update(progress, rate)
109 else:
110 if stagenum == 0:
111 percs = re.findall(r': (\d+)', string)
112 if percs:
113 count = int(percs[-1])
114 if count > self._count:
115 self._count = count
116 self._fire_progress(-count)
117 super(GitProgressHandler, self).write(string)
118
119
Patrick Williamsc124f4f2015-09-15 14:41:29 -0500120class Git(FetchMethod):
Brad Bishop316dfdd2018-06-25 12:45:53 -0400121 bitbake_dir = os.path.abspath(os.path.join(os.path.dirname(os.path.join(os.path.abspath(__file__))), '..', '..', '..'))
122 make_shallow_path = os.path.join(bitbake_dir, 'bin', 'git-make-shallow')
123
Patrick Williamsc124f4f2015-09-15 14:41:29 -0500124 """Class to fetch a module or modules from git repositories"""
125 def init(self, d):
126 pass
127
128 def supports(self, ud, d):
129 """
130 Check to see if a given url can be fetched with git.
131 """
132 return ud.type in ['git']
133
134 def supports_checksum(self, urldata):
135 return False
136
137 def urldata_init(self, ud, d):
138 """
139 init git specific variable within url data
140 so that the git method like latest_revision() can work
141 """
142 if 'protocol' in ud.parm:
143 ud.proto = ud.parm['protocol']
144 elif not ud.host:
145 ud.proto = 'file'
146 else:
147 ud.proto = "git"
Andrew Geissler595f6302022-01-24 19:11:47 +0000148 if ud.host == "github.com" and ud.proto == "git":
149 # github stopped supporting git protocol
150 # https://github.blog/2021-09-01-improving-git-protocol-security-github/#no-more-unauthenticated-git
151 ud.proto = "https"
152 bb.warn("URL: %s uses git protocol which is no longer supported by github. Please change to ;protocol=https in the url." % ud.url)
Patrick Williamsc124f4f2015-09-15 14:41:29 -0500153
154 if not ud.proto in ('git', 'file', 'ssh', 'http', 'https', 'rsync'):
155 raise bb.fetch2.ParameterError("Invalid protocol type", ud.url)
156
157 ud.nocheckout = ud.parm.get("nocheckout","0") == "1"
158
159 ud.rebaseable = ud.parm.get("rebaseable","0") == "1"
160
161 ud.nobranch = ud.parm.get("nobranch","0") == "1"
162
Patrick Williamsc0f7c042017-02-23 20:41:17 -0600163 # usehead implies nobranch
164 ud.usehead = ud.parm.get("usehead","0") == "1"
165 if ud.usehead:
166 if ud.proto != "file":
167 raise bb.fetch2.ParameterError("The usehead option is only for use with local ('protocol=file') git repositories", ud.url)
168 ud.nobranch = 1
169
Patrick Williamsc124f4f2015-09-15 14:41:29 -0500170 # bareclone implies nocheckout
171 ud.bareclone = ud.parm.get("bareclone","0") == "1"
172 if ud.bareclone:
173 ud.nocheckout = 1
174
175 ud.unresolvedrev = {}
Andrew Geissler595f6302022-01-24 19:11:47 +0000176 branches = ud.parm.get("branch", "").split(',')
177 if branches == [""] and not ud.nobranch:
178 bb.warn("URL: %s does not set any branch parameter. The future default branch used by tools and repositories is uncertain and we will therefore soon require this is set in all git urls." % ud.url)
179 branches = ["master"]
Patrick Williamsc124f4f2015-09-15 14:41:29 -0500180 if len(branches) != len(ud.names):
181 raise bb.fetch2.ParameterError("The number of name and branch parameters is not balanced", ud.url)
Brad Bishopd7bf8c12018-02-25 22:55:05 -0500182
Andrew Geisslerc926e172021-05-07 16:11:35 -0500183 ud.noshared = d.getVar("BB_GIT_NOSHARED") == "1"
184
185 ud.cloneflags = "-n"
186 if not ud.noshared:
187 ud.cloneflags += " -s"
Brad Bishopd7bf8c12018-02-25 22:55:05 -0500188 if ud.bareclone:
189 ud.cloneflags += " --mirror"
190
191 ud.shallow = d.getVar("BB_GIT_SHALLOW") == "1"
192 ud.shallow_extra_refs = (d.getVar("BB_GIT_SHALLOW_EXTRA_REFS") or "").split()
193
194 depth_default = d.getVar("BB_GIT_SHALLOW_DEPTH")
195 if depth_default is not None:
196 try:
197 depth_default = int(depth_default or 0)
198 except ValueError:
199 raise bb.fetch2.FetchError("Invalid depth for BB_GIT_SHALLOW_DEPTH: %s" % depth_default)
200 else:
201 if depth_default < 0:
202 raise bb.fetch2.FetchError("Invalid depth for BB_GIT_SHALLOW_DEPTH: %s" % depth_default)
203 else:
204 depth_default = 1
205 ud.shallow_depths = collections.defaultdict(lambda: depth_default)
206
Brad Bishop19323692019-04-05 15:28:33 -0400207 revs_default = d.getVar("BB_GIT_SHALLOW_REVS")
Brad Bishopd7bf8c12018-02-25 22:55:05 -0500208 ud.shallow_revs = []
Patrick Williamsc124f4f2015-09-15 14:41:29 -0500209 ud.branches = {}
Brad Bishop6e60e8b2018-02-01 10:27:11 -0500210 for pos, name in enumerate(ud.names):
211 branch = branches[pos]
Patrick Williamsc124f4f2015-09-15 14:41:29 -0500212 ud.branches[name] = branch
213 ud.unresolvedrev[name] = branch
214
Brad Bishopd7bf8c12018-02-25 22:55:05 -0500215 shallow_depth = d.getVar("BB_GIT_SHALLOW_DEPTH_%s" % name)
216 if shallow_depth is not None:
217 try:
218 shallow_depth = int(shallow_depth or 0)
219 except ValueError:
220 raise bb.fetch2.FetchError("Invalid depth for BB_GIT_SHALLOW_DEPTH_%s: %s" % (name, shallow_depth))
221 else:
222 if shallow_depth < 0:
223 raise bb.fetch2.FetchError("Invalid depth for BB_GIT_SHALLOW_DEPTH_%s: %s" % (name, shallow_depth))
224 ud.shallow_depths[name] = shallow_depth
225
226 revs = d.getVar("BB_GIT_SHALLOW_REVS_%s" % name)
227 if revs is not None:
228 ud.shallow_revs.extend(revs.split())
229 elif revs_default is not None:
230 ud.shallow_revs.extend(revs_default.split())
231
232 if (ud.shallow and
233 not ud.shallow_revs and
234 all(ud.shallow_depths[n] == 0 for n in ud.names)):
235 # Shallow disabled for this URL
236 ud.shallow = False
237
Patrick Williamsc0f7c042017-02-23 20:41:17 -0600238 if ud.usehead:
Andrew Geisslerd1e89492021-02-12 15:35:20 -0600239 # When usehead is set let's associate 'HEAD' with the unresolved
240 # rev of this repository. This will get resolved into a revision
241 # later. If an actual revision happens to have also been provided
242 # then this setting will be overridden.
243 for name in ud.names:
244 ud.unresolvedrev[name] = 'HEAD'
Patrick Williamsc0f7c042017-02-23 20:41:17 -0600245
Andrew Geisslerd5838332022-05-27 11:33:10 -0500246 ud.basecmd = d.getVar("FETCHCMD_git") or "git -c core.fsyncobjectfiles=0 -c gc.autoDetach=false -c core.pager=cat"
Patrick Williamsc124f4f2015-09-15 14:41:29 -0500247
Brad Bishopd7bf8c12018-02-25 22:55:05 -0500248 write_tarballs = d.getVar("BB_GENERATE_MIRROR_TARBALLS") or "0"
249 ud.write_tarballs = write_tarballs != "0" or ud.rebaseable
250 ud.write_shallow_tarballs = (d.getVar("BB_GENERATE_SHALLOW_TARBALLS") or write_tarballs) != "0"
Patrick Williamsc124f4f2015-09-15 14:41:29 -0500251
Brad Bishop6e60e8b2018-02-01 10:27:11 -0500252 ud.setup_revisions(d)
Patrick Williamsc124f4f2015-09-15 14:41:29 -0500253
254 for name in ud.names:
Patrick Williams03907ee2022-05-01 06:28:52 -0500255 # Ensure any revision that doesn't look like a SHA-1 is translated into one
256 if not sha1_re.match(ud.revisions[name] or ''):
Patrick Williamsc124f4f2015-09-15 14:41:29 -0500257 if ud.revisions[name]:
258 ud.unresolvedrev[name] = ud.revisions[name]
259 ud.revisions[name] = self.latest_revision(ud, d, name)
260
Andrew Geisslerc3d88e42020-10-02 09:45:00 -0500261 gitsrcname = '%s%s' % (ud.host.replace(':', '.'), ud.path.replace('/', '.').replace('*', '.').replace(' ','_'))
Patrick Williamsc124f4f2015-09-15 14:41:29 -0500262 if gitsrcname.startswith('.'):
263 gitsrcname = gitsrcname[1:]
264
Patrick Williams03907ee2022-05-01 06:28:52 -0500265 # For a rebaseable git repo, it is necessary to keep a mirror tar ball
266 # per revision, so that even if the revision disappears from the
Patrick Williamsc124f4f2015-09-15 14:41:29 -0500267 # upstream repo in the future, the mirror will remain intact and still
Patrick Williams03907ee2022-05-01 06:28:52 -0500268 # contain the revision
Patrick Williamsc124f4f2015-09-15 14:41:29 -0500269 if ud.rebaseable:
270 for name in ud.names:
271 gitsrcname = gitsrcname + '_' + ud.revisions[name]
Patrick Williamsc124f4f2015-09-15 14:41:29 -0500272
Brad Bishopd7bf8c12018-02-25 22:55:05 -0500273 dl_dir = d.getVar("DL_DIR")
Brad Bishop1a4b7ee2018-12-16 17:11:34 -0800274 gitdir = d.getVar("GITDIR") or (dl_dir + "/git2")
Brad Bishopd7bf8c12018-02-25 22:55:05 -0500275 ud.clonedir = os.path.join(gitdir, gitsrcname)
Patrick Williamsc124f4f2015-09-15 14:41:29 -0500276 ud.localfile = ud.clonedir
277
Brad Bishopd7bf8c12018-02-25 22:55:05 -0500278 mirrortarball = 'git2_%s.tar.gz' % gitsrcname
279 ud.fullmirror = os.path.join(dl_dir, mirrortarball)
280 ud.mirrortarballs = [mirrortarball]
281 if ud.shallow:
282 tarballname = gitsrcname
283 if ud.bareclone:
284 tarballname = "%s_bare" % tarballname
285
286 if ud.shallow_revs:
287 tarballname = "%s_%s" % (tarballname, "_".join(sorted(ud.shallow_revs)))
288
289 for name, revision in sorted(ud.revisions.items()):
290 tarballname = "%s_%s" % (tarballname, ud.revisions[name][:7])
291 depth = ud.shallow_depths[name]
292 if depth:
293 tarballname = "%s-%s" % (tarballname, depth)
294
295 shallow_refs = []
296 if not ud.nobranch:
297 shallow_refs.extend(ud.branches.values())
298 if ud.shallow_extra_refs:
299 shallow_refs.extend(r.replace('refs/heads/', '').replace('*', 'ALL') for r in ud.shallow_extra_refs)
300 if shallow_refs:
301 tarballname = "%s_%s" % (tarballname, "_".join(sorted(shallow_refs)).replace('/', '.'))
302
303 fetcher = self.__class__.__name__.lower()
304 ud.shallowtarball = '%sshallow_%s.tar.gz' % (fetcher, tarballname)
305 ud.fullshallow = os.path.join(dl_dir, ud.shallowtarball)
306 ud.mirrortarballs.insert(0, ud.shallowtarball)
307
Patrick Williamsc124f4f2015-09-15 14:41:29 -0500308 def localpath(self, ud, d):
309 return ud.clonedir
310
311 def need_update(self, ud, d):
Brad Bishop1a4b7ee2018-12-16 17:11:34 -0800312 return self.clonedir_need_update(ud, d) or self.shallow_tarball_need_update(ud) or self.tarball_need_update(ud)
313
314 def clonedir_need_update(self, ud, d):
Patrick Williamsc124f4f2015-09-15 14:41:29 -0500315 if not os.path.exists(ud.clonedir):
316 return True
Brad Bishop64c979e2019-11-04 13:55:29 -0500317 if ud.shallow and ud.write_shallow_tarballs and self.clonedir_need_shallow_revs(ud, d):
318 return True
Patrick Williamsc124f4f2015-09-15 14:41:29 -0500319 for name in ud.names:
Patrick Williamsc0f7c042017-02-23 20:41:17 -0600320 if not self._contains_ref(ud, d, name, ud.clonedir):
Patrick Williamsc124f4f2015-09-15 14:41:29 -0500321 return True
Patrick Williamsc124f4f2015-09-15 14:41:29 -0500322 return False
323
Brad Bishop64c979e2019-11-04 13:55:29 -0500324 def clonedir_need_shallow_revs(self, ud, d):
325 for rev in ud.shallow_revs:
326 try:
327 runfetchcmd('%s rev-parse -q --verify %s' % (ud.basecmd, rev), d, quiet=True, workdir=ud.clonedir)
328 except bb.fetch2.FetchError:
329 return rev
330 return None
331
Brad Bishop1a4b7ee2018-12-16 17:11:34 -0800332 def shallow_tarball_need_update(self, ud):
333 return ud.shallow and ud.write_shallow_tarballs and not os.path.exists(ud.fullshallow)
334
335 def tarball_need_update(self, ud):
336 return ud.write_tarballs and not os.path.exists(ud.fullmirror)
337
Patrick Williamsc124f4f2015-09-15 14:41:29 -0500338 def try_premirror(self, ud, d):
339 # If we don't do this, updating an existing checkout with only premirrors
340 # is not possible
Brad Bishop19323692019-04-05 15:28:33 -0400341 if bb.utils.to_boolean(d.getVar("BB_FETCH_PREMIRRORONLY")):
Patrick Williamsc124f4f2015-09-15 14:41:29 -0500342 return True
343 if os.path.exists(ud.clonedir):
344 return False
345 return True
346
347 def download(self, ud, d):
348 """Fetch url"""
349
Brad Bishopd7bf8c12018-02-25 22:55:05 -0500350 # A current clone is preferred to either tarball, a shallow tarball is
351 # preferred to an out of date clone, and a missing clone will use
352 # either tarball.
Brad Bishop1a4b7ee2018-12-16 17:11:34 -0800353 if ud.shallow and os.path.exists(ud.fullshallow) and self.need_update(ud, d):
Brad Bishopd7bf8c12018-02-25 22:55:05 -0500354 ud.localpath = ud.fullshallow
355 return
Brad Bishop1a4b7ee2018-12-16 17:11:34 -0800356 elif os.path.exists(ud.fullmirror) and not os.path.exists(ud.clonedir):
Patrick Williamsc124f4f2015-09-15 14:41:29 -0500357 bb.utils.mkdirhier(ud.clonedir)
Brad Bishop6e60e8b2018-02-01 10:27:11 -0500358 runfetchcmd("tar -xzf %s" % ud.fullmirror, d, workdir=ud.clonedir)
Patrick Williamsc124f4f2015-09-15 14:41:29 -0500359
360 repourl = self._get_repo_url(ud)
361
362 # If the repo still doesn't exist, fallback to cloning it
363 if not os.path.exists(ud.clonedir):
364 # We do this since git will use a "-l" option automatically for local urls where possible
365 if repourl.startswith("file://"):
366 repourl = repourl[7:]
Andrew Geissler4c19ea12020-10-27 13:52:24 -0500367 clone_cmd = "LANG=C %s clone --bare --mirror %s %s --progress" % (ud.basecmd, shlex.quote(repourl), ud.clonedir)
Patrick Williamsc124f4f2015-09-15 14:41:29 -0500368 if ud.proto.lower() != 'file':
Brad Bishop6e60e8b2018-02-01 10:27:11 -0500369 bb.fetch2.check_network_access(d, clone_cmd, ud.url)
Patrick Williamsc0f7c042017-02-23 20:41:17 -0600370 progresshandler = GitProgressHandler(d)
371 runfetchcmd(clone_cmd, d, log=progresshandler)
Patrick Williamsc124f4f2015-09-15 14:41:29 -0500372
Patrick Williamsc124f4f2015-09-15 14:41:29 -0500373 # Update the checkout if needed
Brad Bishop64c979e2019-11-04 13:55:29 -0500374 if self.clonedir_need_update(ud, d):
Brad Bishop6ef32652018-10-09 18:59:25 +0100375 output = runfetchcmd("%s remote" % ud.basecmd, d, quiet=True, workdir=ud.clonedir)
376 if "origin" in output:
377 runfetchcmd("%s remote rm origin" % ud.basecmd, d, workdir=ud.clonedir)
Patrick Williamsc124f4f2015-09-15 14:41:29 -0500378
Andrew Geissler4c19ea12020-10-27 13:52:24 -0500379 runfetchcmd("%s remote add --mirror=fetch origin %s" % (ud.basecmd, shlex.quote(repourl)), d, workdir=ud.clonedir)
380 fetch_cmd = "LANG=C %s fetch -f --progress %s refs/*:refs/*" % (ud.basecmd, shlex.quote(repourl))
Patrick Williamsc124f4f2015-09-15 14:41:29 -0500381 if ud.proto.lower() != 'file':
382 bb.fetch2.check_network_access(d, fetch_cmd, ud.url)
Patrick Williamsc0f7c042017-02-23 20:41:17 -0600383 progresshandler = GitProgressHandler(d)
384 runfetchcmd(fetch_cmd, d, log=progresshandler, workdir=ud.clonedir)
385 runfetchcmd("%s prune-packed" % ud.basecmd, d, workdir=ud.clonedir)
Brad Bishop316dfdd2018-06-25 12:45:53 -0400386 runfetchcmd("%s pack-refs --all" % ud.basecmd, d, workdir=ud.clonedir)
Patrick Williamsc0f7c042017-02-23 20:41:17 -0600387 runfetchcmd("%s pack-redundant --all | xargs -r rm" % ud.basecmd, d, workdir=ud.clonedir)
Patrick Williamsd7e96312015-09-22 08:09:05 -0500388 try:
389 os.unlink(ud.fullmirror)
390 except OSError as exc:
391 if exc.errno != errno.ENOENT:
392 raise
Brad Bishop1a4b7ee2018-12-16 17:11:34 -0800393
Patrick Williamsc124f4f2015-09-15 14:41:29 -0500394 for name in ud.names:
Patrick Williamsc0f7c042017-02-23 20:41:17 -0600395 if not self._contains_ref(ud, d, name, ud.clonedir):
Patrick Williamsc124f4f2015-09-15 14:41:29 -0500396 raise bb.fetch2.FetchError("Unable to find revision %s in branch %s even from upstream" % (ud.revisions[name], ud.branches[name]))
397
Brad Bishop64c979e2019-11-04 13:55:29 -0500398 if ud.shallow and ud.write_shallow_tarballs:
399 missing_rev = self.clonedir_need_shallow_revs(ud, d)
400 if missing_rev:
401 raise bb.fetch2.FetchError("Unable to find revision %s even from upstream" % missing_rev)
402
Andrew Geisslerd1e89492021-02-12 15:35:20 -0600403 if self._contains_lfs(ud, d, ud.clonedir) and self._need_lfs(ud):
404 # Unpack temporary working copy, use it to run 'git checkout' to force pre-fetching
Andrew Geissler7e0e3c02022-02-25 20:34:39 +0000405 # of all LFS blobs needed at the srcrev.
Andrew Geisslerd1e89492021-02-12 15:35:20 -0600406 #
407 # It would be nice to just do this inline here by running 'git-lfs fetch'
408 # on the bare clonedir, but that operation requires a working copy on some
409 # releases of Git LFS.
410 tmpdir = tempfile.mkdtemp(dir=d.getVar('DL_DIR'))
411 try:
412 # Do the checkout. This implicitly involves a Git LFS fetch.
Andrew Geisslerc926e172021-05-07 16:11:35 -0500413 Git.unpack(self, ud, tmpdir, d)
Andrew Geisslerd1e89492021-02-12 15:35:20 -0600414
415 # Scoop up a copy of any stuff that Git LFS downloaded. Merge them into
416 # the bare clonedir.
417 #
418 # As this procedure is invoked repeatedly on incremental fetches as
419 # a recipe's SRCREV is bumped throughout its lifetime, this will
420 # result in a gradual accumulation of LFS blobs in <ud.clonedir>/lfs
421 # corresponding to all the blobs reachable from the different revs
422 # fetched across time.
423 #
424 # Only do this if the unpack resulted in a .git/lfs directory being
425 # created; this only happens if at least one blob needed to be
426 # downloaded.
427 if os.path.exists(os.path.join(tmpdir, "git", ".git", "lfs")):
428 runfetchcmd("tar -cf - lfs | tar -xf - -C %s" % ud.clonedir, d, workdir="%s/git/.git" % tmpdir)
429 finally:
430 bb.utils.remove(tmpdir, recurse=True)
431
Patrick Williamsc124f4f2015-09-15 14:41:29 -0500432 def build_mirror_data(self, ud, d):
Andrew Geissler5199d832021-09-24 16:47:35 -0500433
434 # Create as a temp file and move atomically into position to avoid races
435 @contextmanager
436 def create_atomic(filename):
437 fd, tfile = tempfile.mkstemp(dir=os.path.dirname(filename))
438 try:
439 yield tfile
440 umask = os.umask(0o666)
441 os.umask(umask)
442 os.chmod(tfile, (0o666 & ~umask))
443 os.rename(tfile, filename)
444 finally:
445 os.close(fd)
446
Brad Bishopd7bf8c12018-02-25 22:55:05 -0500447 if ud.shallow and ud.write_shallow_tarballs:
448 if not os.path.exists(ud.fullshallow):
449 if os.path.islink(ud.fullshallow):
450 os.unlink(ud.fullshallow)
451 tempdir = tempfile.mkdtemp(dir=d.getVar('DL_DIR'))
452 shallowclone = os.path.join(tempdir, 'git')
453 try:
454 self.clone_shallow_local(ud, shallowclone, d)
455
456 logger.info("Creating tarball of git repository")
Andrew Geissler5199d832021-09-24 16:47:35 -0500457 with create_atomic(ud.fullshallow) as tfile:
458 runfetchcmd("tar -czf %s ." % tfile, d, workdir=shallowclone)
Brad Bishopd7bf8c12018-02-25 22:55:05 -0500459 runfetchcmd("touch %s.done" % ud.fullshallow, d)
460 finally:
461 bb.utils.remove(tempdir, recurse=True)
462 elif ud.write_tarballs and not os.path.exists(ud.fullmirror):
Patrick Williamsc124f4f2015-09-15 14:41:29 -0500463 if os.path.islink(ud.fullmirror):
464 os.unlink(ud.fullmirror)
465
Patrick Williamsc124f4f2015-09-15 14:41:29 -0500466 logger.info("Creating tarball of git repository")
Andrew Geissler5199d832021-09-24 16:47:35 -0500467 with create_atomic(ud.fullmirror) as tfile:
Andrew Geissler9aee5002022-03-30 16:27:02 +0000468 mtime = runfetchcmd("git log --all -1 --format=%cD", d,
469 quiet=True, workdir=ud.clonedir)
Patrick Williams03907ee2022-05-01 06:28:52 -0500470 runfetchcmd("tar -czf %s --owner oe:0 --group oe:0 --mtime \"%s\" ."
Andrew Geissler9aee5002022-03-30 16:27:02 +0000471 % (tfile, mtime), d, workdir=ud.clonedir)
Brad Bishop6e60e8b2018-02-01 10:27:11 -0500472 runfetchcmd("touch %s.done" % ud.fullmirror, d)
Patrick Williamsc124f4f2015-09-15 14:41:29 -0500473
Brad Bishopd7bf8c12018-02-25 22:55:05 -0500474 def clone_shallow_local(self, ud, dest, d):
475 """Clone the repo and make it shallow.
476
477 The upstream url of the new clone isn't set at this time, as it'll be
478 set correctly when unpacked."""
479 runfetchcmd("%s clone %s %s %s" % (ud.basecmd, ud.cloneflags, ud.clonedir, dest), d)
480
481 to_parse, shallow_branches = [], []
482 for name in ud.names:
483 revision = ud.revisions[name]
484 depth = ud.shallow_depths[name]
485 if depth:
486 to_parse.append('%s~%d^{}' % (revision, depth - 1))
487
488 # For nobranch, we need a ref, otherwise the commits will be
489 # removed, and for non-nobranch, we truncate the branch to our
490 # srcrev, to avoid keeping unnecessary history beyond that.
491 branch = ud.branches[name]
492 if ud.nobranch:
493 ref = "refs/shallow/%s" % name
494 elif ud.bareclone:
495 ref = "refs/heads/%s" % branch
496 else:
497 ref = "refs/remotes/origin/%s" % branch
498
499 shallow_branches.append(ref)
500 runfetchcmd("%s update-ref %s %s" % (ud.basecmd, ref, revision), d, workdir=dest)
501
502 # Map srcrev+depths to revisions
503 parsed_depths = runfetchcmd("%s rev-parse %s" % (ud.basecmd, " ".join(to_parse)), d, workdir=dest)
504
505 # Resolve specified revisions
506 parsed_revs = runfetchcmd("%s rev-parse %s" % (ud.basecmd, " ".join('"%s^{}"' % r for r in ud.shallow_revs)), d, workdir=dest)
507 shallow_revisions = parsed_depths.splitlines() + parsed_revs.splitlines()
508
509 # Apply extra ref wildcards
510 all_refs = runfetchcmd('%s for-each-ref "--format=%%(refname)"' % ud.basecmd,
511 d, workdir=dest).splitlines()
512 for r in ud.shallow_extra_refs:
513 if not ud.bareclone:
514 r = r.replace('refs/heads/', 'refs/remotes/origin/')
515
516 if '*' in r:
517 matches = filter(lambda a: fnmatch.fnmatchcase(a, r), all_refs)
518 shallow_branches.extend(matches)
519 else:
520 shallow_branches.append(r)
521
522 # Make the repository shallow
Brad Bishop316dfdd2018-06-25 12:45:53 -0400523 shallow_cmd = [self.make_shallow_path, '-s']
Brad Bishopd7bf8c12018-02-25 22:55:05 -0500524 for b in shallow_branches:
525 shallow_cmd.append('-r')
526 shallow_cmd.append(b)
527 shallow_cmd.extend(shallow_revisions)
528 runfetchcmd(subprocess.list2cmdline(shallow_cmd), d, workdir=dest)
529
Patrick Williamsc124f4f2015-09-15 14:41:29 -0500530 def unpack(self, ud, destdir, d):
531 """ unpack the downloaded src to destdir"""
532
Andrew Geissler595f6302022-01-24 19:11:47 +0000533 subdir = ud.parm.get("subdir")
534 subpath = ud.parm.get("subpath")
535 readpathspec = ""
536 def_destsuffix = "git/"
537
538 if subpath:
539 readpathspec = ":%s" % subpath
540 def_destsuffix = "%s/" % os.path.basename(subpath.rstrip('/'))
541
542 if subdir:
543 # If 'subdir' param exists, create a dir and use it as destination for unpack cmd
544 if os.path.isabs(subdir):
545 if not os.path.realpath(subdir).startswith(os.path.realpath(destdir)):
546 raise bb.fetch2.UnpackError("subdir argument isn't a subdirectory of unpack root %s" % destdir, ud.url)
547 destdir = subdir
548 else:
549 destdir = os.path.join(destdir, subdir)
550 def_destsuffix = ""
Patrick Williamsc124f4f2015-09-15 14:41:29 -0500551
552 destsuffix = ud.parm.get("destsuffix", def_destsuffix)
553 destdir = ud.destdir = os.path.join(destdir, destsuffix)
554 if os.path.exists(destdir):
555 bb.utils.prunedir(destdir)
556
Andrew Geisslerd1e89492021-02-12 15:35:20 -0600557 need_lfs = self._need_lfs(ud)
Brad Bishopa34c0302019-09-23 22:34:48 -0400558
Andrew Geissler4ed12e12020-06-05 18:00:41 -0500559 if not need_lfs:
560 ud.basecmd = "GIT_LFS_SKIP_SMUDGE=1 " + ud.basecmd
561
Brad Bishop1a4b7ee2018-12-16 17:11:34 -0800562 source_found = False
563 source_error = []
564
565 if not source_found:
566 clonedir_is_up_to_date = not self.clonedir_need_update(ud, d)
567 if clonedir_is_up_to_date:
568 runfetchcmd("%s clone %s %s/ %s" % (ud.basecmd, ud.cloneflags, ud.clonedir, destdir), d)
569 source_found = True
570 else:
571 source_error.append("clone directory not available or not up to date: " + ud.clonedir)
572
573 if not source_found:
574 if ud.shallow:
575 if os.path.exists(ud.fullshallow):
576 bb.utils.mkdirhier(destdir)
577 runfetchcmd("tar -xzf %s" % ud.fullshallow, d, workdir=destdir)
578 source_found = True
579 else:
580 source_error.append("shallow clone not available: " + ud.fullshallow)
581 else:
582 source_error.append("shallow clone not enabled")
583
584 if not source_found:
585 raise bb.fetch2.UnpackError("No up to date source found: " + "; ".join(source_error), ud.url)
Patrick Williamsc124f4f2015-09-15 14:41:29 -0500586
Patrick Williamsc124f4f2015-09-15 14:41:29 -0500587 repourl = self._get_repo_url(ud)
Andrew Geissler4c19ea12020-10-27 13:52:24 -0500588 runfetchcmd("%s remote set-url origin %s" % (ud.basecmd, shlex.quote(repourl)), d, workdir=destdir)
Brad Bishopc342db32019-05-15 21:57:59 -0400589
590 if self._contains_lfs(ud, d, destdir):
Brad Bishop00e122a2019-10-05 11:10:57 -0400591 if need_lfs and not self._find_git_lfs(d):
592 raise bb.fetch2.FetchError("Repository %s has LFS content, install git-lfs on host to download (or set lfs=0 to ignore it)" % (repourl))
Andrew Geissler4ed12e12020-06-05 18:00:41 -0500593 elif not need_lfs:
Brad Bishopa34c0302019-09-23 22:34:48 -0400594 bb.note("Repository %s has LFS content but it is not being fetched" % (repourl))
Brad Bishopc342db32019-05-15 21:57:59 -0400595
Patrick Williamsc124f4f2015-09-15 14:41:29 -0500596 if not ud.nocheckout:
Andrew Geissler595f6302022-01-24 19:11:47 +0000597 if subpath:
Patrick Williamsc0f7c042017-02-23 20:41:17 -0600598 runfetchcmd("%s read-tree %s%s" % (ud.basecmd, ud.revisions[ud.names[0]], readpathspec), d,
599 workdir=destdir)
600 runfetchcmd("%s checkout-index -q -f -a" % ud.basecmd, d, workdir=destdir)
Patrick Williamsc124f4f2015-09-15 14:41:29 -0500601 elif not ud.nobranch:
602 branchname = ud.branches[ud.names[0]]
603 runfetchcmd("%s checkout -B %s %s" % (ud.basecmd, branchname, \
Patrick Williamsc0f7c042017-02-23 20:41:17 -0600604 ud.revisions[ud.names[0]]), d, workdir=destdir)
Andre Rosa49271d42017-09-07 11:15:55 +0200605 runfetchcmd("%s branch %s --set-upstream-to origin/%s" % (ud.basecmd, branchname, \
Patrick Williamsc0f7c042017-02-23 20:41:17 -0600606 branchname), d, workdir=destdir)
Patrick Williamsc124f4f2015-09-15 14:41:29 -0500607 else:
Patrick Williamsc0f7c042017-02-23 20:41:17 -0600608 runfetchcmd("%s checkout %s" % (ud.basecmd, ud.revisions[ud.names[0]]), d, workdir=destdir)
Patrick Williamsc124f4f2015-09-15 14:41:29 -0500609
610 return True
611
612 def clean(self, ud, d):
613 """ clean the git directory """
614
Brad Bishop19323692019-04-05 15:28:33 -0400615 to_remove = [ud.localpath, ud.fullmirror, ud.fullmirror + ".done"]
616 # The localpath is a symlink to clonedir when it is cloned from a
617 # mirror, so remove both of them.
618 if os.path.islink(ud.localpath):
619 clonedir = os.path.realpath(ud.localpath)
620 to_remove.append(clonedir)
621
622 for r in to_remove:
623 if os.path.exists(r):
624 bb.note('Removing %s' % r)
625 bb.utils.remove(r, True)
Patrick Williamsc124f4f2015-09-15 14:41:29 -0500626
627 def supports_srcrev(self):
628 return True
629
Patrick Williamsc0f7c042017-02-23 20:41:17 -0600630 def _contains_ref(self, ud, d, name, wd):
Patrick Williamsc124f4f2015-09-15 14:41:29 -0500631 cmd = ""
632 if ud.nobranch:
633 cmd = "%s log --pretty=oneline -n 1 %s -- 2> /dev/null | wc -l" % (
634 ud.basecmd, ud.revisions[name])
635 else:
636 cmd = "%s branch --contains %s --list %s 2> /dev/null | wc -l" % (
637 ud.basecmd, ud.revisions[name], ud.branches[name])
638 try:
Patrick Williamsc0f7c042017-02-23 20:41:17 -0600639 output = runfetchcmd(cmd, d, quiet=True, workdir=wd)
Patrick Williamsc124f4f2015-09-15 14:41:29 -0500640 except bb.fetch2.FetchError:
641 return False
642 if len(output.split()) > 1:
643 raise bb.fetch2.FetchError("The command '%s' gave output with more then 1 line unexpectedly, output: '%s'" % (cmd, output))
644 return output.split()[0] != "0"
645
Andrew Geisslerd1e89492021-02-12 15:35:20 -0600646 def _need_lfs(self, ud):
647 return ud.parm.get("lfs", "1") == "1"
648
Brad Bishopc342db32019-05-15 21:57:59 -0400649 def _contains_lfs(self, ud, d, wd):
650 """
651 Check if the repository has 'lfs' (large file) content
652 """
Andrew Geissler4ed12e12020-06-05 18:00:41 -0500653
654 if not ud.nobranch:
655 branchname = ud.branches[ud.names[0]]
656 else:
657 branchname = "master"
658
Andrew Geisslerd1e89492021-02-12 15:35:20 -0600659 # The bare clonedir doesn't use the remote names; it has the branch immediately.
660 if wd == ud.clonedir:
661 refname = ud.branches[ud.names[0]]
662 else:
663 refname = "origin/%s" % ud.branches[ud.names[0]]
664
665 cmd = "%s grep lfs %s:.gitattributes | wc -l" % (
666 ud.basecmd, refname)
Andrew Geissler4ed12e12020-06-05 18:00:41 -0500667
Brad Bishopc342db32019-05-15 21:57:59 -0400668 try:
669 output = runfetchcmd(cmd, d, quiet=True, workdir=wd)
670 if int(output) > 0:
671 return True
672 except (bb.fetch2.FetchError,ValueError):
673 pass
674 return False
675
Brad Bishop00e122a2019-10-05 11:10:57 -0400676 def _find_git_lfs(self, d):
677 """
678 Return True if git-lfs can be found, False otherwise.
679 """
680 import shutil
681 return shutil.which("git-lfs", path=d.getVar('PATH')) is not None
682
Patrick Williamsc124f4f2015-09-15 14:41:29 -0500683 def _get_repo_url(self, ud):
684 """
685 Return the repository URL
686 """
Andrew Geissler6ce62a22020-11-30 19:58:47 -0600687 # Note that we do not support passwords directly in the git urls. There are several
688 # reasons. SRC_URI can be written out to things like buildhistory and people don't
689 # want to leak passwords like that. Its also all too easy to share metadata without
690 # removing the password. ssh keys, ~/.netrc and ~/.ssh/config files can be used as
691 # alternatives so we will not take patches adding password support here.
Patrick Williamsc124f4f2015-09-15 14:41:29 -0500692 if ud.user:
693 username = ud.user + '@'
694 else:
695 username = ""
696 return "%s://%s%s%s" % (ud.proto, username, ud.host, ud.path)
697
698 def _revision_key(self, ud, d, name):
699 """
700 Return a unique key for the url
701 """
Andrew Geissler82c905d2020-04-13 13:39:40 -0500702 # Collapse adjacent slashes
Andrew Geissler82c905d2020-04-13 13:39:40 -0500703 return "git:" + ud.host + slash_re.sub(".", ud.path) + ud.unresolvedrev[name]
Patrick Williamsc124f4f2015-09-15 14:41:29 -0500704
705 def _lsremote(self, ud, d, search):
706 """
707 Run git ls-remote with the specified search string
708 """
Brad Bishop6e60e8b2018-02-01 10:27:11 -0500709 # Prevent recursion e.g. in OE if SRCPV is in PV, PV is in WORKDIR,
710 # and WORKDIR is in PATH (as a result of RSS), our call to
711 # runfetchcmd() exports PATH so this function will get called again (!)
712 # In this scenario the return call of the function isn't actually
713 # important - WORKDIR isn't needed in PATH to call git ls-remote
714 # anyway.
715 if d.getVar('_BB_GIT_IN_LSREMOTE', False):
716 return ''
717 d.setVar('_BB_GIT_IN_LSREMOTE', '1')
718 try:
719 repourl = self._get_repo_url(ud)
Andrew Geissler4c19ea12020-10-27 13:52:24 -0500720 cmd = "%s ls-remote %s %s" % \
721 (ud.basecmd, shlex.quote(repourl), search)
Brad Bishop6e60e8b2018-02-01 10:27:11 -0500722 if ud.proto.lower() != 'file':
723 bb.fetch2.check_network_access(d, cmd, repourl)
724 output = runfetchcmd(cmd, d, True)
725 if not output:
726 raise bb.fetch2.FetchError("The command %s gave empty output unexpectedly" % cmd, ud.url)
727 finally:
728 d.delVar('_BB_GIT_IN_LSREMOTE')
Patrick Williamsc124f4f2015-09-15 14:41:29 -0500729 return output
730
731 def _latest_revision(self, ud, d, name):
732 """
733 Compute the HEAD revision for the url
734 """
Andrew Geissler7e0e3c02022-02-25 20:34:39 +0000735 if not d.getVar("__BBSEENSRCREV"):
736 raise bb.fetch2.FetchError("Recipe uses a floating tag/branch without a fixed SRCREV yet doesn't call bb.fetch2.get_srcrev() (use SRCPV in PV for OE).")
737
738 # Ensure we mark as not cached
739 bb.fetch2.get_autorev(d)
740
Patrick Williamsc124f4f2015-09-15 14:41:29 -0500741 output = self._lsremote(ud, d, "")
742 # Tags of the form ^{} may not work, need to fallback to other form
Patrick Williamsc0f7c042017-02-23 20:41:17 -0600743 if ud.unresolvedrev[name][:5] == "refs/" or ud.usehead:
Patrick Williamsc124f4f2015-09-15 14:41:29 -0500744 head = ud.unresolvedrev[name]
745 tag = ud.unresolvedrev[name]
746 else:
747 head = "refs/heads/%s" % ud.unresolvedrev[name]
748 tag = "refs/tags/%s" % ud.unresolvedrev[name]
749 for s in [head, tag + "^{}", tag]:
Patrick Williamsc0f7c042017-02-23 20:41:17 -0600750 for l in output.strip().split('\n'):
751 sha1, ref = l.split()
752 if s == ref:
753 return sha1
Patrick Williamsc124f4f2015-09-15 14:41:29 -0500754 raise bb.fetch2.FetchError("Unable to resolve '%s' in upstream git repository in git ls-remote output for %s" % \
755 (ud.unresolvedrev[name], ud.host+ud.path))
756
757 def latest_versionstring(self, ud, d):
758 """
759 Compute the latest release name like "x.y.x" in "x.y.x+gitHASH"
760 by searching through the tags output of ls-remote, comparing
761 versions and returning the highest match.
762 """
763 pupver = ('', '')
764
Brad Bishop19323692019-04-05 15:28:33 -0400765 tagregex = re.compile(d.getVar('UPSTREAM_CHECK_GITTAGREGEX') or r"(?P<pver>([0-9][\.|_]?)+)")
Patrick Williamsc124f4f2015-09-15 14:41:29 -0500766 try:
767 output = self._lsremote(ud, d, "refs/tags/*")
Brad Bishop316dfdd2018-06-25 12:45:53 -0400768 except (bb.fetch2.FetchError, bb.fetch2.NetworkAccess) as e:
769 bb.note("Could not list remote: %s" % str(e))
Patrick Williamsc124f4f2015-09-15 14:41:29 -0500770 return pupver
771
772 verstring = ""
773 revision = ""
774 for line in output.split("\n"):
775 if not line:
776 break
777
778 tag_head = line.split("/")[-1]
779 # Ignore non-released branches
Brad Bishop19323692019-04-05 15:28:33 -0400780 m = re.search(r"(alpha|beta|rc|final)+", tag_head)
Patrick Williamsc124f4f2015-09-15 14:41:29 -0500781 if m:
782 continue
783
784 # search for version in the line
785 tag = tagregex.search(tag_head)
Andrew Geissler82c905d2020-04-13 13:39:40 -0500786 if tag is None:
Patrick Williamsc124f4f2015-09-15 14:41:29 -0500787 continue
788
789 tag = tag.group('pver')
790 tag = tag.replace("_", ".")
791
792 if verstring and bb.utils.vercmp(("0", tag, ""), ("0", verstring, "")) < 0:
793 continue
794
795 verstring = tag
796 revision = line.split()[0]
797 pupver = (verstring, revision)
798
799 return pupver
800
801 def _build_revision(self, ud, d, name):
802 return ud.revisions[name]
803
804 def gitpkgv_revision(self, ud, d, name):
805 """
806 Return a sortable revision number by counting commits in the history
807 Based on gitpkgv.bblass in meta-openembedded
808 """
809 rev = self._build_revision(ud, d, name)
810 localpath = ud.localpath
811 rev_file = os.path.join(localpath, "oe-gitpkgv_" + rev)
812 if not os.path.exists(localpath):
813 commits = None
814 else:
815 if not os.path.exists(rev_file) or not os.path.getsize(rev_file):
816 from pipes import quote
817 commits = bb.fetch2.runfetchcmd(
Brad Bishop6e60e8b2018-02-01 10:27:11 -0500818 "git rev-list %s -- | wc -l" % quote(rev),
Patrick Williamsc124f4f2015-09-15 14:41:29 -0500819 d, quiet=True).strip().lstrip('0')
820 if commits:
821 open(rev_file, "w").write("%d\n" % int(commits))
822 else:
823 commits = open(rev_file, "r").readline(128).strip()
824 if commits:
825 return False, "%s+%s" % (commits, rev[:7])
826 else:
827 return True, str(rev)
828
829 def checkstatus(self, fetch, ud, d):
830 try:
831 self._lsremote(ud, d, "")
832 return True
Brad Bishop6e60e8b2018-02-01 10:27:11 -0500833 except bb.fetch2.FetchError:
Patrick Williamsc124f4f2015-09-15 14:41:29 -0500834 return False