| #!/usr/bin/env python3 | 
 | # ex:ts=4:sw=4:sts=4:et | 
 | # -*- tab-width: 4; c-basic-offset: 4; indent-tabs-mode: nil -*- | 
 | # | 
 | # Copyright 2011 Intel Corporation | 
 | # Authored-by:  Yu Ke <ke.yu@intel.com> | 
 | #               Paul Eggleton <paul.eggleton@intel.com> | 
 | #               Richard Purdie <richard.purdie@intel.com> | 
 | # | 
 | # This program is free software; you can redistribute it and/or modify | 
 | # it under the terms of the GNU General Public License version 2 as | 
 | # published by the Free Software Foundation. | 
 | # | 
 | # This program is distributed in the hope that it will be useful, | 
 | # but WITHOUT ANY WARRANTY; without even the implied warranty of | 
 | # MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the | 
 | # GNU General Public License for more details. | 
 | # | 
 | # You should have received a copy of the GNU General Public License along | 
 | # with this program; if not, write to the Free Software Foundation, Inc., | 
 | # 51 Franklin Street, Fifth Floor, Boston, MA 02110-1301 USA. | 
 |  | 
 | import fnmatch | 
 | import os, sys | 
 | import optparse | 
 | import logging | 
 | import subprocess | 
 | import tempfile | 
 | import configparser | 
 | import re | 
 | import copy | 
 | import pipes | 
 | import shutil | 
 | from collections import OrderedDict | 
 | from string import Template | 
 | from functools import reduce | 
 |  | 
 | __version__ = "0.2.1" | 
 |  | 
 | def logger_create(): | 
 |     logger = logging.getLogger("") | 
 |     loggerhandler = logging.StreamHandler() | 
 |     loggerhandler.setFormatter(logging.Formatter("[%(asctime)s] %(message)s","%H:%M:%S")) | 
 |     logger.addHandler(loggerhandler) | 
 |     logger.setLevel(logging.INFO) | 
 |     return logger | 
 |  | 
 | logger = logger_create() | 
 |  | 
 | def get_current_branch(repodir=None): | 
 |     try: | 
 |         if not os.path.exists(os.path.join(repodir if repodir else '', ".git")): | 
 |             # Repo not created yet (i.e. during init) so just assume master | 
 |             return "master" | 
 |         branchname = runcmd("git symbolic-ref HEAD 2>/dev/null", repodir).strip() | 
 |         if branchname.startswith("refs/heads/"): | 
 |             branchname = branchname[11:] | 
 |         return branchname | 
 |     except subprocess.CalledProcessError: | 
 |         return "" | 
 |  | 
 | class Configuration(object): | 
 |     """ | 
 |     Manages the configuration | 
 |  | 
 |     For an example config file, see combo-layer.conf.example | 
 |  | 
 |     """ | 
 |     def __init__(self, options): | 
 |         for key, val in options.__dict__.items(): | 
 |             setattr(self, key, val) | 
 |  | 
 |         def readsection(parser, section, repo): | 
 |             for (name, value) in parser.items(section): | 
 |                 if value.startswith("@"): | 
 |                     self.repos[repo][name] = eval(value.strip("@")) | 
 |                 else: | 
 |                     # Apply special type transformations for some properties. | 
 |                     # Type matches the RawConfigParser.get*() methods. | 
 |                     types = {'signoff': 'boolean', 'update': 'boolean', 'history': 'boolean'} | 
 |                     if name in types: | 
 |                         value = getattr(parser, 'get' + types[name])(section, name) | 
 |                     self.repos[repo][name] = value | 
 |  | 
 |         def readglobalsection(parser, section): | 
 |             for (name, value) in parser.items(section): | 
 |                 if name == "commit_msg": | 
 |                     self.commit_msg_template = value | 
 |  | 
 |         logger.debug("Loading config file %s" % self.conffile) | 
 |         self.parser = configparser.ConfigParser() | 
 |         with open(self.conffile) as f: | 
 |             self.parser.readfp(f) | 
 |  | 
 |         # initialize default values | 
 |         self.commit_msg_template = "Automatic commit to update last_revision" | 
 |  | 
 |         self.repos = {} | 
 |         for repo in self.parser.sections(): | 
 |             if repo == "combo-layer-settings": | 
 |                 # special handling for global settings | 
 |                 readglobalsection(self.parser, repo) | 
 |             else: | 
 |                 self.repos[repo] = {} | 
 |                 readsection(self.parser, repo, repo) | 
 |  | 
 |         # Load local configuration, if available | 
 |         self.localconffile = None | 
 |         self.localparser = None | 
 |         self.combobranch = None | 
 |         if self.conffile.endswith('.conf'): | 
 |             lcfile = self.conffile.replace('.conf', '-local.conf') | 
 |             if os.path.exists(lcfile): | 
 |                 # Read combo layer branch | 
 |                 self.combobranch = get_current_branch() | 
 |                 logger.debug("Combo layer branch is %s" % self.combobranch) | 
 |  | 
 |                 self.localconffile = lcfile | 
 |                 logger.debug("Loading local config file %s" % self.localconffile) | 
 |                 self.localparser = configparser.ConfigParser() | 
 |                 with open(self.localconffile) as f: | 
 |                     self.localparser.readfp(f) | 
 |  | 
 |                 for section in self.localparser.sections(): | 
 |                     if '|' in section: | 
 |                         sectionvals = section.split('|') | 
 |                         repo = sectionvals[0] | 
 |                         if sectionvals[1] != self.combobranch: | 
 |                             continue | 
 |                     else: | 
 |                         repo = section | 
 |                     if repo in self.repos: | 
 |                         readsection(self.localparser, section, repo) | 
 |  | 
 |     def update(self, repo, option, value, initmode=False): | 
 |         # If the main config has the option already, that is what we | 
 |         # are expected to modify. | 
 |         if self.localparser and not self.parser.has_option(repo, option): | 
 |             parser = self.localparser | 
 |             section = "%s|%s" % (repo, self.combobranch) | 
 |             conffile = self.localconffile | 
 |             if initmode and not parser.has_section(section): | 
 |                 parser.add_section(section) | 
 |         else: | 
 |             parser = self.parser | 
 |             section = repo | 
 |             conffile = self.conffile | 
 |         parser.set(section, option, value) | 
 |         with open(conffile, "w") as f: | 
 |             parser.write(f) | 
 |         self.repos[repo][option] = value | 
 |  | 
 |     def sanity_check(self, initmode=False): | 
 |         required_options=["src_uri", "local_repo_dir", "dest_dir", "last_revision"] | 
 |         if initmode: | 
 |             required_options.remove("last_revision") | 
 |         msg = "" | 
 |         missing_options = [] | 
 |         for name in self.repos: | 
 |             for option in required_options: | 
 |                 if option not in self.repos[name]: | 
 |                     msg = "%s\nOption %s is not defined for component %s" %(msg, option, name) | 
 |                     missing_options.append(option) | 
 |             # Sanitize dest_dir so that we do not have to deal with edge cases | 
 |             # (unset, empty string, double slashes) in the rest of the code. | 
 |             # It not being set will still be flagged as error because it is | 
 |             # listed as required option above; that could be changed now. | 
 |             dest_dir = os.path.normpath(self.repos[name].get("dest_dir", ".")) | 
 |             self.repos[name]["dest_dir"] = "." if not dest_dir else dest_dir | 
 |         if msg != "": | 
 |             logger.error("configuration file %s has the following error: %s" % (self.conffile,msg)) | 
 |             if self.localconffile and 'last_revision' in missing_options: | 
 |                 logger.error("local configuration file %s may be missing configuration for combo branch %s" % (self.localconffile, self.combobranch)) | 
 |             sys.exit(1) | 
 |  | 
 |         # filterdiff is required by action_splitpatch, so check its availability | 
 |         if subprocess.call("which filterdiff > /dev/null 2>&1", shell=True) != 0: | 
 |             logger.error("ERROR: patchutils package is missing, please install it (e.g. # apt-get install patchutils)") | 
 |             sys.exit(1) | 
 |  | 
 | def runcmd(cmd,destdir=None,printerr=True,out=None,env=None): | 
 |     """ | 
 |         execute command, raise CalledProcessError if fail | 
 |         return output if succeed | 
 |     """ | 
 |     logger.debug("run cmd '%s' in %s" % (cmd, os.getcwd() if destdir is None else destdir)) | 
 |     if not out: | 
 |         out = tempfile.TemporaryFile() | 
 |         err = out | 
 |     else: | 
 |         err = tempfile.TemporaryFile() | 
 |     try: | 
 |         subprocess.check_call(cmd, stdout=out, stderr=err, cwd=destdir, shell=isinstance(cmd, str), env=env or os.environ) | 
 |     except subprocess.CalledProcessError as e: | 
 |         err.seek(0) | 
 |         if printerr: | 
 |             logger.error("%s" % err.read()) | 
 |         raise e | 
 |  | 
 |     err.seek(0) | 
 |     output = err.read().decode('utf-8') | 
 |     logger.debug("output: %s" % output.replace(chr(0), '\\0')) | 
 |     return output | 
 |  | 
 | def action_init(conf, args): | 
 |     """ | 
 |         Clone component repositories | 
 |         Check git is initialised; if not, copy initial data from component repos | 
 |     """ | 
 |     for name in conf.repos: | 
 |         ldir = conf.repos[name]['local_repo_dir'] | 
 |         if not os.path.exists(ldir): | 
 |             logger.info("cloning %s to %s" %(conf.repos[name]['src_uri'], ldir)) | 
 |             subprocess.check_call("git clone %s %s" % (conf.repos[name]['src_uri'], ldir), shell=True) | 
 |     if not os.path.exists(".git"): | 
 |         runcmd("git init") | 
 |         if conf.history: | 
 |             # Need a common ref for all trees. | 
 |             runcmd('git commit -m "initial empty commit" --allow-empty') | 
 |             startrev = runcmd('git rev-parse master').strip() | 
 |  | 
 |         for name in conf.repos: | 
 |             repo = conf.repos[name] | 
 |             ldir = repo['local_repo_dir'] | 
 |             branch = repo.get('branch', "master") | 
 |             lastrev = repo.get('last_revision', None) | 
 |             if lastrev and lastrev != "HEAD": | 
 |                 initialrev = lastrev | 
 |                 if branch: | 
 |                     if not check_rev_branch(name, ldir, lastrev, branch): | 
 |                         sys.exit(1) | 
 |                 logger.info("Copying data from %s at specified revision %s..." % (name, lastrev)) | 
 |             else: | 
 |                 lastrev = None | 
 |                 initialrev = branch | 
 |                 logger.info("Copying data from %s..." % name) | 
 |             # Sanity check initialrev and turn it into hash (required for copying history, | 
 |             # because resolving a name ref only works in the component repo). | 
 |             rev = runcmd('git rev-parse %s' % initialrev, ldir).strip() | 
 |             if rev != initialrev: | 
 |                 try: | 
 |                     refs = runcmd('git show-ref -s %s' % initialrev, ldir).split('\n') | 
 |                     if len(set(refs)) > 1: | 
 |                         # Happens for example when configured to track | 
 |                         # "master" and there is a refs/heads/master. The | 
 |                         # traditional behavior from "git archive" (preserved | 
 |                         # here) it to choose the first one. This might not be | 
 |                         # intended, so at least warn about it. | 
 |                         logger.warn("%s: initial revision '%s' not unique, picking result of rev-parse = %s" % | 
 |                                     (name, initialrev, refs[0])) | 
 |                         initialrev = rev | 
 |                 except: | 
 |                     # show-ref fails for hashes. Skip the sanity warning in that case. | 
 |                     pass | 
 |                 initialrev = rev | 
 |             dest_dir = repo['dest_dir'] | 
 |             if dest_dir != ".": | 
 |                 extract_dir = os.path.join(os.getcwd(), dest_dir) | 
 |                 if not os.path.exists(extract_dir): | 
 |                     os.makedirs(extract_dir) | 
 |             else: | 
 |                 extract_dir = os.getcwd() | 
 |             file_filter = repo.get('file_filter', "") | 
 |             exclude_patterns = repo.get('file_exclude', '').split() | 
 |             def copy_selected_files(initialrev, extract_dir, file_filter, exclude_patterns, ldir, | 
 |                                     subdir=""): | 
 |                 # When working inside a filtered branch which had the | 
 |                 # files already moved, we need to prepend the | 
 |                 # subdirectory to all filters, otherwise they would | 
 |                 # not match. | 
 |                 if subdir == '.': | 
 |                     subdir = '' | 
 |                 elif subdir: | 
 |                     subdir = os.path.normpath(subdir) | 
 |                     file_filter = ' '.join([subdir + '/' + x for x in file_filter.split()]) | 
 |                     exclude_patterns = [subdir + '/' + x for x in exclude_patterns] | 
 |                 # To handle both cases, we cd into the target | 
 |                 # directory and optionally tell tar to strip the path | 
 |                 # prefix when the files were already moved. | 
 |                 subdir_components = len(subdir.split(os.path.sep)) if subdir else 0 | 
 |                 strip=('--strip-components=%d' % subdir_components) if subdir else '' | 
 |                 # TODO: file_filter wild cards do not work (and haven't worked before either), because | 
 |                 # a) GNU tar requires a --wildcards parameter before turning on wild card matching. | 
 |                 # b) The semantic is not as intendend (src/*.c also matches src/foo/bar.c, | 
 |                 #    in contrast to the other use of file_filter as parameter of "git archive" | 
 |                 #    where it only matches .c files directly in src). | 
 |                 files = runcmd("git archive %s %s | tar -x -v %s -C %s %s" % | 
 |                                (initialrev, subdir, | 
 |                                 strip, extract_dir, file_filter), | 
 |                                ldir) | 
 |                 if exclude_patterns: | 
 |                     # Implement file removal by letting tar create the | 
 |                     # file and then deleting it in the file system | 
 |                     # again. Uses the list of files created by tar (easier | 
 |                     # than walking the tree). | 
 |                     for file in files.split('\n'): | 
 |                         for pattern in exclude_patterns: | 
 |                             if fnmatch.fnmatch(file, pattern): | 
 |                                 os.unlink(os.path.join(*([extract_dir] + ['..'] * subdir_components + [file]))) | 
 |                                 break | 
 |  | 
 |             if not conf.history: | 
 |                 copy_selected_files(initialrev, extract_dir, file_filter, exclude_patterns, ldir) | 
 |             else: | 
 |                 # First fetch remote history into local repository. | 
 |                 # We need a ref for that, so ensure that there is one. | 
 |                 refname = "combo-layer-init-%s" % name | 
 |                 runcmd("git branch -f %s %s" % (refname, initialrev), ldir) | 
 |                 runcmd("git fetch %s %s" % (ldir, refname)) | 
 |                 runcmd("git branch -D %s" % refname, ldir) | 
 |                 # Make that the head revision. | 
 |                 runcmd("git checkout -b %s %s" % (name, initialrev)) | 
 |                 # Optional: cut the history by replacing the given | 
 |                 # start point(s) with commits providing the same | 
 |                 # content (aka tree), but with commit information that | 
 |                 # makes it clear that this is an artifically created | 
 |                 # commit and nothing the original authors had anything | 
 |                 # to do with. | 
 |                 since_rev = repo.get('since_revision', '') | 
 |                 if since_rev: | 
 |                     committer = runcmd('git var GIT_AUTHOR_IDENT').strip() | 
 |                     # Same time stamp, no name. | 
 |                     author = re.sub('.* (\d+ [+-]\d+)', r'unknown <unknown> \1', committer) | 
 |                     logger.info('author %s' % author) | 
 |                     for rev in since_rev.split(): | 
 |                         # Resolve in component repo... | 
 |                         rev = runcmd('git log --oneline --no-abbrev-commit -n1 %s' % rev, ldir).split()[0] | 
 |                         # ... and then get the tree in current | 
 |                         # one. The commit should be in both repos with | 
 |                         # the same tree, but better check here. | 
 |                         tree = runcmd('git show -s --pretty=format:%%T %s' % rev).strip() | 
 |                         with tempfile.NamedTemporaryFile() as editor: | 
 |                             editor.write('''cat >$1 <<EOF | 
 | tree %s | 
 | author %s | 
 | committer %s | 
 |  | 
 | %s: squashed import of component | 
 |  | 
 | This commit copies the entire set of files as found in | 
 | %s %s | 
 |  | 
 | For more information about previous commits, see the | 
 | upstream repository. | 
 |  | 
 | Commit created by combo-layer. | 
 | EOF | 
 | ''' % (tree, author, committer, name, name, since_rev)) | 
 |                             editor.flush() | 
 |                             os.environ['GIT_EDITOR'] = 'sh %s' % editor.name | 
 |                             runcmd('git replace --edit %s' % rev) | 
 |  | 
 |                 # Optional: rewrite history to change commit messages or to move files. | 
 |                 if 'hook' in repo or dest_dir != ".": | 
 |                     filter_branch = ['git', 'filter-branch', '--force'] | 
 |                     with tempfile.NamedTemporaryFile() as hookwrapper: | 
 |                         if 'hook' in repo: | 
 |                             # Create a shell script wrapper around the original hook that | 
 |                             # can be used by git filter-branch. Hook may or may not have | 
 |                             # an absolute path. | 
 |                             hook = repo['hook'] | 
 |                             hook = os.path.join(os.path.dirname(conf.conffile), '..', hook) | 
 |                             # The wrappers turns the commit message | 
 |                             # from stdin into a fake patch header. | 
 |                             # This is good enough for changing Subject | 
 |                             # and commit msg body with normal | 
 |                             # combo-layer hooks. | 
 |                             hookwrapper.write('''set -e | 
 | tmpname=$(mktemp) | 
 | trap "rm $tmpname" EXIT | 
 | echo -n 'Subject: [PATCH] ' >>$tmpname | 
 | cat >>$tmpname | 
 | if ! [ $(tail -c 1 $tmpname | od -A n -t x1) == '0a' ]; then | 
 |     echo >>$tmpname | 
 | fi | 
 | echo '---' >>$tmpname | 
 | %s $tmpname $GIT_COMMIT %s | 
 | tail -c +18 $tmpname | head -c -4 | 
 | ''' % (hook, name)) | 
 |                             hookwrapper.flush() | 
 |                             filter_branch.extend(['--msg-filter', 'bash %s' % hookwrapper.name]) | 
 |                         if dest_dir != ".": | 
 |                             parent = os.path.dirname(dest_dir) | 
 |                             if not parent: | 
 |                                 parent = '.' | 
 |                             # May run outside of the current directory, so do not assume that .git exists. | 
 |                             filter_branch.extend(['--tree-filter', 'mkdir -p .git/tmptree && find . -mindepth 1 -maxdepth 1 ! -name .git -print0 | xargs -0 -I SOURCE mv SOURCE .git/tmptree && mkdir -p %s && mv .git/tmptree %s' % (parent, dest_dir)]) | 
 |                         filter_branch.append('HEAD') | 
 |                         runcmd(filter_branch) | 
 |                         runcmd('git update-ref -d refs/original/refs/heads/%s' % name) | 
 |                 repo['rewritten_revision'] = runcmd('git rev-parse HEAD').strip() | 
 |                 repo['stripped_revision'] = repo['rewritten_revision'] | 
 |                 # Optional filter files: remove everything and re-populate using the normal filtering code. | 
 |                 # Override any potential .gitignore. | 
 |                 if file_filter or exclude_patterns: | 
 |                     runcmd('git rm -rf .') | 
 |                     if not os.path.exists(extract_dir): | 
 |                         os.makedirs(extract_dir) | 
 |                     copy_selected_files('HEAD', extract_dir, file_filter, exclude_patterns, '.', | 
 |                                         subdir=dest_dir) | 
 |                     runcmd('git add --all --force .') | 
 |                     if runcmd('git status --porcelain'): | 
 |                         # Something to commit. | 
 |                         runcmd(['git', 'commit', '-m', | 
 |                                 '''%s: select file subset | 
 |  | 
 | Files from the component repository were chosen based on | 
 | the following filters: | 
 | file_filter = %s | 
 | file_exclude = %s''' % (name, file_filter or '<empty>', repo.get('file_exclude', '<empty>'))]) | 
 |                         repo['stripped_revision'] = runcmd('git rev-parse HEAD').strip() | 
 |  | 
 |             if not lastrev: | 
 |                 lastrev = runcmd('git rev-parse %s' % initialrev, ldir).strip() | 
 |                 conf.update(name, "last_revision", lastrev, initmode=True) | 
 |  | 
 |         if not conf.history: | 
 |             runcmd("git add .") | 
 |         else: | 
 |             # Create Octopus merge commit according to http://stackoverflow.com/questions/10874149/git-octopus-merge-with-unrelated-repositoies | 
 |             runcmd('git checkout master') | 
 |             merge = ['git', 'merge', '--no-commit'] | 
 |             for name in conf.repos: | 
 |                 repo = conf.repos[name] | 
 |                 # Use branch created earlier. | 
 |                 merge.append(name) | 
 |                 # Root all commits which have no parent in the common | 
 |                 # ancestor in the new repository. | 
 |                 for start in runcmd('git log --pretty=format:%%H --max-parents=0 %s' % name).split('\n'): | 
 |                     runcmd('git replace --graft %s %s' % (start, startrev)) | 
 |             try: | 
 |                 runcmd(merge) | 
 |             except Exception as error: | 
 |                 logger.info('''Merging component repository history failed, perhaps because of merge conflicts. | 
 | It may be possible to commit anyway after resolving these conflicts. | 
 |  | 
 | %s''' % error) | 
 |             # Create MERGE_HEAD and MERGE_MSG. "git merge" itself | 
 |             # does not create MERGE_HEAD in case of a (harmless) failure, | 
 |             # and we want certain auto-generated information in the | 
 |             # commit message for future reference and/or automation. | 
 |             with open('.git/MERGE_HEAD', 'w') as head: | 
 |                 with open('.git/MERGE_MSG', 'w') as msg: | 
 |                     msg.write('repo: initial import of components\n\n') | 
 |                     # head.write('%s\n' % startrev) | 
 |                     for name in conf.repos: | 
 |                         repo = conf.repos[name] | 
 |                         # <upstream ref> <rewritten ref> <rewritten + files removed> | 
 |                         msg.write('combo-layer-%s: %s %s %s\n' % (name, | 
 |                                                                   repo['last_revision'], | 
 |                                                                   repo['rewritten_revision'], | 
 |                                                                   repo['stripped_revision'])) | 
 |                         rev = runcmd('git rev-parse %s' % name).strip() | 
 |                         head.write('%s\n' % rev) | 
 |  | 
 |         if conf.localconffile: | 
 |             localadded = True | 
 |             try: | 
 |                 runcmd("git rm --cached %s" % conf.localconffile, printerr=False) | 
 |             except subprocess.CalledProcessError: | 
 |                 localadded = False | 
 |             if localadded: | 
 |                 localrelpath = os.path.relpath(conf.localconffile) | 
 |                 runcmd("grep -q %s .gitignore || echo %s >> .gitignore" % (localrelpath, localrelpath)) | 
 |                 runcmd("git add .gitignore") | 
 |                 logger.info("Added local configuration file %s to .gitignore", localrelpath) | 
 |         logger.info("Initial combo layer repository data has been created; please make any changes if desired and then use 'git commit' to make the initial commit.") | 
 |     else: | 
 |         logger.info("Repository already initialised, nothing to do.") | 
 |  | 
 |  | 
 | def check_repo_clean(repodir): | 
 |     """ | 
 |         check if the repo is clean | 
 |         exit if repo is dirty | 
 |     """ | 
 |     output=runcmd("git status --porcelain", repodir) | 
 |     r = re.compile('\?\? patch-.*/') | 
 |     dirtyout = [item for item in output.splitlines() if not r.match(item)] | 
 |     if dirtyout: | 
 |         logger.error("git repo %s is dirty, please fix it first", repodir) | 
 |         sys.exit(1) | 
 |  | 
 | def check_patch(patchfile): | 
 |     f = open(patchfile, 'rb') | 
 |     ln = f.readline() | 
 |     of = None | 
 |     in_patch = False | 
 |     beyond_msg = False | 
 |     pre_buf = b'' | 
 |     while ln: | 
 |         if not beyond_msg: | 
 |             if ln == b'---\n': | 
 |                 if not of: | 
 |                     break | 
 |                 in_patch = False | 
 |                 beyond_msg = True | 
 |             elif ln.startswith(b'--- '): | 
 |                 # We have a diff in the commit message | 
 |                 in_patch = True | 
 |                 if not of: | 
 |                     print('WARNING: %s contains a diff in its commit message, indenting to avoid failure during apply' % patchfile) | 
 |                     of = open(patchfile + '.tmp', 'wb') | 
 |                     of.write(pre_buf) | 
 |                     pre_buf = b'' | 
 |             elif in_patch and not ln[0] in b'+-@ \n\r': | 
 |                 in_patch = False | 
 |         if of: | 
 |             if in_patch: | 
 |                 of.write(b' ' + ln) | 
 |             else: | 
 |                 of.write(ln) | 
 |         else: | 
 |             pre_buf += ln | 
 |         ln = f.readline() | 
 |     f.close() | 
 |     if of: | 
 |         of.close() | 
 |         os.rename(patchfile + '.tmp', patchfile) | 
 |  | 
 | def drop_to_shell(workdir=None): | 
 |     if not sys.stdin.isatty(): | 
 |         print("Not a TTY so can't drop to shell for resolution, exiting.") | 
 |         return False | 
 |  | 
 |     shell = os.environ.get('SHELL', 'bash') | 
 |     print('Dropping to shell "%s"\n' \ | 
 |           'When you are finished, run the following to continue:\n' \ | 
 |           '       exit    -- continue to apply the patches\n' \ | 
 |           '       exit 1  -- abort\n' % shell); | 
 |     ret = subprocess.call([shell], cwd=workdir) | 
 |     if ret != 0: | 
 |         print("Aborting") | 
 |         return False | 
 |     else: | 
 |         return True | 
 |  | 
 | def check_rev_branch(component, repodir, rev, branch): | 
 |     try: | 
 |         actualbranch = runcmd("git branch --contains %s" % rev, repodir, printerr=False) | 
 |     except subprocess.CalledProcessError as e: | 
 |         if e.returncode == 129: | 
 |             actualbranch = "" | 
 |         else: | 
 |             raise | 
 |  | 
 |     if not actualbranch: | 
 |         logger.error("%s: specified revision %s is invalid!" % (component, rev)) | 
 |         return False | 
 |  | 
 |     branches = [] | 
 |     branchlist = actualbranch.split("\n") | 
 |     for b in branchlist: | 
 |         branches.append(b.strip().split(' ')[-1]) | 
 |  | 
 |     if branch not in branches: | 
 |         logger.error("%s: specified revision %s is not on specified branch %s!" % (component, rev, branch)) | 
 |         return False | 
 |     return True | 
 |  | 
 | def get_repos(conf, repo_names): | 
 |     repos = [] | 
 |     for name in repo_names: | 
 |         if name.startswith('-'): | 
 |             break | 
 |         else: | 
 |             repos.append(name) | 
 |     for repo in repos: | 
 |         if not repo in conf.repos: | 
 |             logger.error("Specified component '%s' not found in configuration" % repo) | 
 |             sys.exit(1) | 
 |  | 
 |     if not repos: | 
 |         repos = [ repo for repo in conf.repos if conf.repos[repo].get("update", True) ] | 
 |  | 
 |     return repos | 
 |  | 
 | def action_pull(conf, args): | 
 |     """ | 
 |         update the component repos only | 
 |     """ | 
 |     repos = get_repos(conf, args[1:]) | 
 |  | 
 |     # make sure all repos are clean | 
 |     for name in repos: | 
 |         check_repo_clean(conf.repos[name]['local_repo_dir']) | 
 |  | 
 |     for name in repos: | 
 |         repo = conf.repos[name] | 
 |         ldir = repo['local_repo_dir'] | 
 |         branch = repo.get('branch', "master") | 
 |         logger.info("update branch %s of component repo %s in %s ..." % (branch, name, ldir)) | 
 |         if not conf.hard_reset: | 
 |             # Try to pull only the configured branch. Beware that this may fail | 
 |             # when the branch is currently unknown (for example, after reconfiguring | 
 |             # combo-layer). In that case we need to fetch everything and try the check out | 
 |             # and pull again. | 
 |             try: | 
 |                 runcmd("git checkout %s" % branch, ldir, printerr=False) | 
 |             except subprocess.CalledProcessError: | 
 |                 output=runcmd("git fetch", ldir) | 
 |                 logger.info(output) | 
 |                 runcmd("git checkout %s" % branch, ldir) | 
 |                 runcmd("git pull --ff-only", ldir) | 
 |             else: | 
 |                 output=runcmd("git pull --ff-only", ldir) | 
 |                 logger.info(output) | 
 |         else: | 
 |             output=runcmd("git fetch", ldir) | 
 |             logger.info(output) | 
 |             runcmd("git checkout %s" % branch, ldir) | 
 |             runcmd("git reset --hard FETCH_HEAD", ldir) | 
 |  | 
 | def action_update(conf, args): | 
 |     """ | 
 |         update the component repos | 
 |         either: | 
 |            generate the patch list | 
 |            apply the generated patches | 
 |         or: | 
 |            re-creates the entire component history and merges them | 
 |            into the current branch with a merge commit | 
 |     """ | 
 |     components = [arg.split(':')[0] for arg in args[1:]] | 
 |     revisions = {} | 
 |     for arg in args[1:]: | 
 |         if ':' in arg: | 
 |             a = arg.split(':', 1) | 
 |             revisions[a[0]] = a[1] | 
 |     repos = get_repos(conf, components) | 
 |  | 
 |     # make sure combo repo is clean | 
 |     check_repo_clean(os.getcwd()) | 
 |  | 
 |     # Check whether we keep the component histories. Must be | 
 |     # set either via --history command line parameter or consistently | 
 |     # in combo-layer.conf. Mixing modes is (currently, and probably | 
 |     # permanently because it would be complicated) not supported. | 
 |     if conf.history: | 
 |         history = True | 
 |     else: | 
 |         history = None | 
 |         for name in repos: | 
 |             repo = conf.repos[name] | 
 |             repo_history = repo.get('history', False) | 
 |             if history is None: | 
 |                 history = repo_history | 
 |             elif history != repo_history: | 
 |                 logger.error("'history' property is set inconsistently") | 
 |                 sys.exit(1) | 
 |  | 
 |     # Step 1: update the component repos | 
 |     if conf.nopull: | 
 |         logger.info("Skipping pull (-n)") | 
 |     else: | 
 |         action_pull(conf, ['arg0'] + components) | 
 |  | 
 |     if history: | 
 |         update_with_history(conf, components, revisions, repos) | 
 |     else: | 
 |         update_with_patches(conf, components, revisions, repos) | 
 |  | 
 | def update_with_patches(conf, components, revisions, repos): | 
 |     import uuid | 
 |     patch_dir = "patch-%s" % uuid.uuid4() | 
 |     if not os.path.exists(patch_dir): | 
 |         os.mkdir(patch_dir) | 
 |  | 
 |     for name in repos: | 
 |         revision = revisions.get(name, None) | 
 |         repo = conf.repos[name] | 
 |         ldir = repo['local_repo_dir'] | 
 |         dest_dir = repo['dest_dir'] | 
 |         branch = repo.get('branch', "master") | 
 |         repo_patch_dir = os.path.join(os.getcwd(), patch_dir, name) | 
 |  | 
 |         # Step 2: generate the patch list and store to patch dir | 
 |         logger.info("Generating patches from %s..." % name) | 
 |         top_revision = revision or branch | 
 |         if not check_rev_branch(name, ldir, top_revision, branch): | 
 |             sys.exit(1) | 
 |         if dest_dir != ".": | 
 |             prefix = "--src-prefix=a/%s/ --dst-prefix=b/%s/" % (dest_dir, dest_dir) | 
 |         else: | 
 |             prefix = "" | 
 |         if repo['last_revision'] == "": | 
 |             logger.info("Warning: last_revision of component %s is not set, starting from the first commit" % name) | 
 |             patch_cmd_range = "--root %s" % top_revision | 
 |             rev_cmd_range = top_revision | 
 |         else: | 
 |             if not check_rev_branch(name, ldir, repo['last_revision'], branch): | 
 |                 sys.exit(1) | 
 |             patch_cmd_range = "%s..%s" % (repo['last_revision'], top_revision) | 
 |             rev_cmd_range = patch_cmd_range | 
 |  | 
 |         file_filter = repo.get('file_filter',".") | 
 |  | 
 |         # Filter out unwanted files | 
 |         exclude = repo.get('file_exclude', '') | 
 |         if exclude: | 
 |             for path in exclude.split(): | 
 |                 p = "%s/%s" % (dest_dir, path) if dest_dir != '.' else path | 
 |                 file_filter += " ':!%s'" % p | 
 |  | 
 |         patch_cmd = "git format-patch -N %s --output-directory %s %s -- %s" % \ | 
 |             (prefix,repo_patch_dir, patch_cmd_range, file_filter) | 
 |         output = runcmd(patch_cmd, ldir) | 
 |         logger.debug("generated patch set:\n%s" % output) | 
 |         patchlist = output.splitlines() | 
 |  | 
 |         rev_cmd = "git rev-list --no-merges %s -- %s" % (rev_cmd_range, file_filter) | 
 |         revlist = runcmd(rev_cmd, ldir).splitlines() | 
 |  | 
 |         # Step 3: Call repo specific hook to adjust patch | 
 |         if 'hook' in repo: | 
 |             # hook parameter is: ./hook patchpath revision reponame | 
 |             count=len(revlist)-1 | 
 |             for patch in patchlist: | 
 |                 runcmd("%s %s %s %s" % (repo['hook'], patch, revlist[count], name)) | 
 |                 count=count-1 | 
 |  | 
 |         # Step 4: write patch list and revision list to file, for user to edit later | 
 |         patchlist_file = os.path.join(os.getcwd(), patch_dir, "patchlist-%s" % name) | 
 |         repo['patchlist'] = patchlist_file | 
 |         f = open(patchlist_file, 'w') | 
 |         count=len(revlist)-1 | 
 |         for patch in patchlist: | 
 |             f.write("%s %s\n" % (patch, revlist[count])) | 
 |             check_patch(os.path.join(patch_dir, patch)) | 
 |             count=count-1 | 
 |         f.close() | 
 |  | 
 |     # Step 5: invoke bash for user to edit patch and patch list | 
 |     if conf.interactive: | 
 |         print('You may now edit the patch and patch list in %s\n' \ | 
 |               'For example, you can remove unwanted patch entries from patchlist-*, so that they will be not applied later' % patch_dir); | 
 |         if not drop_to_shell(patch_dir): | 
 |             sys.exit(1) | 
 |  | 
 |     # Step 6: apply the generated and revised patch | 
 |     apply_patchlist(conf, repos) | 
 |     runcmd("rm -rf %s" % patch_dir) | 
 |  | 
 |     # Step 7: commit the updated config file if it's being tracked | 
 |     commit_conf_file(conf, components) | 
 |  | 
 | def conf_commit_msg(conf, components): | 
 |     # create the "components" string | 
 |     component_str = "all components" | 
 |     if len(components) > 0: | 
 |         # otherwise tell which components were actually changed | 
 |         component_str = ", ".join(components) | 
 |  | 
 |     # expand the template with known values | 
 |     template = Template(conf.commit_msg_template) | 
 |     msg = template.substitute(components = component_str) | 
 |     return msg | 
 |  | 
 | def commit_conf_file(conf, components, commit=True): | 
 |     relpath = os.path.relpath(conf.conffile) | 
 |     try: | 
 |         output = runcmd("git status --porcelain %s" % relpath, printerr=False) | 
 |     except: | 
 |         # Outside the repository | 
 |         output = None | 
 |     if output: | 
 |         if output.lstrip().startswith("M"): | 
 |             logger.info("Committing updated configuration file") | 
 |             if commit: | 
 |                 msg = conf_commit_msg(conf, components) | 
 |                 runcmd('git commit -m'.split() + [msg, relpath]) | 
 |             else: | 
 |                 runcmd('git add %s' % relpath) | 
 |             return True | 
 |     return False | 
 |  | 
 | def apply_patchlist(conf, repos): | 
 |     """ | 
 |         apply the generated patch list to combo repo | 
 |     """ | 
 |     for name in repos: | 
 |         repo = conf.repos[name] | 
 |         lastrev = repo["last_revision"] | 
 |         prevrev = lastrev | 
 |  | 
 |         # Get non-blank lines from patch list file | 
 |         patchlist = [] | 
 |         if os.path.exists(repo['patchlist']) or not conf.interactive: | 
 |             # Note: we want this to fail here if the file doesn't exist and we're not in | 
 |             # interactive mode since the file should exist in this case | 
 |             with open(repo['patchlist']) as f: | 
 |                 for line in f: | 
 |                     line = line.rstrip() | 
 |                     if line: | 
 |                         patchlist.append(line) | 
 |  | 
 |         ldir = conf.repos[name]['local_repo_dir'] | 
 |         branch = conf.repos[name].get('branch', "master") | 
 |         branchrev = runcmd("git rev-parse %s" % branch, ldir).strip() | 
 |  | 
 |         if patchlist: | 
 |             logger.info("Applying patches from %s..." % name) | 
 |             linecount = len(patchlist) | 
 |             i = 1 | 
 |             for line in patchlist: | 
 |                 patchfile = line.split()[0] | 
 |                 lastrev = line.split()[1] | 
 |                 patchdisp = os.path.relpath(patchfile) | 
 |                 if os.path.getsize(patchfile) == 0: | 
 |                     logger.info("(skipping %d/%d %s - no changes)" % (i, linecount, patchdisp)) | 
 |                 else: | 
 |                     cmd = "git am --keep-cr %s-p1 %s" % ('-s ' if repo.get('signoff', True) else '', patchfile) | 
 |                     logger.info("Applying %d/%d: %s" % (i, linecount, patchdisp)) | 
 |                     try: | 
 |                         runcmd(cmd) | 
 |                     except subprocess.CalledProcessError: | 
 |                         logger.info('Running "git am --abort" to cleanup repo') | 
 |                         runcmd("git am --abort") | 
 |                         logger.error('"%s" failed' % cmd) | 
 |                         logger.info("Please manually apply patch %s" % patchdisp) | 
 |                         logger.info("Note: if you exit and continue applying without manually applying the patch, it will be skipped") | 
 |                         if not drop_to_shell(): | 
 |                             if prevrev != repo['last_revision']: | 
 |                                 conf.update(name, "last_revision", prevrev) | 
 |                             sys.exit(1) | 
 |                 prevrev = lastrev | 
 |                 i += 1 | 
 |             # Once all patches are applied, we should update | 
 |             # last_revision to the branch head instead of the last | 
 |             # applied patch. The two are not necessarily the same when | 
 |             # the last commit is a merge commit or when the patches at | 
 |             # the branch head were intentionally excluded. | 
 |             # | 
 |             # If we do not do that for a merge commit, the next | 
 |             # combo-layer run will only exclude patches reachable from | 
 |             # one of the merged branches and try to re-apply patches | 
 |             # from other branches even though they were already | 
 |             # copied. | 
 |             # | 
 |             # If patches were intentionally excluded, the next run will | 
 |             # present them again instead of skipping over them. This | 
 |             # may or may not be intended, so the code here is conservative | 
 |             # and only addresses the "head is merge commit" case. | 
 |             if lastrev != branchrev and \ | 
 |                len(runcmd("git show --pretty=format:%%P --no-patch %s" % branch, ldir).split()) > 1: | 
 |                 lastrev = branchrev | 
 |         else: | 
 |             logger.info("No patches to apply from %s" % name) | 
 |             lastrev = branchrev | 
 |  | 
 |         if lastrev != repo['last_revision']: | 
 |             conf.update(name, "last_revision", lastrev) | 
 |  | 
 | def action_splitpatch(conf, args): | 
 |     """ | 
 |         generate the commit patch and | 
 |         split the patch per repo | 
 |     """ | 
 |     logger.debug("action_splitpatch") | 
 |     if len(args) > 1: | 
 |         commit = args[1] | 
 |     else: | 
 |         commit = "HEAD" | 
 |     patchdir = "splitpatch-%s" % commit | 
 |     if not os.path.exists(patchdir): | 
 |         os.mkdir(patchdir) | 
 |  | 
 |     # filerange_root is for the repo whose dest_dir is root "." | 
 |     # and it should be specified by excluding all other repo dest dir | 
 |     # like "-x repo1 -x repo2 -x repo3 ..." | 
 |     filerange_root = "" | 
 |     for name in conf.repos: | 
 |         dest_dir = conf.repos[name]['dest_dir'] | 
 |         if dest_dir != ".": | 
 |             filerange_root = '%s -x "%s/*"' % (filerange_root, dest_dir) | 
 |  | 
 |     for name in conf.repos: | 
 |         dest_dir = conf.repos[name]['dest_dir'] | 
 |         patch_filename = "%s/%s.patch" % (patchdir, name) | 
 |         if dest_dir == ".": | 
 |             cmd = "git format-patch -n1 --stdout %s^..%s | filterdiff -p1 %s > %s" % (commit, commit, filerange_root, patch_filename) | 
 |         else: | 
 |             cmd = "git format-patch --no-prefix -n1 --stdout %s^..%s -- %s > %s" % (commit, commit, dest_dir, patch_filename) | 
 |         runcmd(cmd) | 
 |         # Detect empty patches (including those produced by filterdiff above | 
 |         # that contain only preamble text) | 
 |         if os.path.getsize(patch_filename) == 0 or runcmd("filterdiff %s" % patch_filename) == "": | 
 |             os.remove(patch_filename) | 
 |             logger.info("(skipping %s - no changes)", name) | 
 |         else: | 
 |             logger.info(patch_filename) | 
 |  | 
 | def update_with_history(conf, components, revisions, repos): | 
 |     '''Update all components with full history. | 
 |  | 
 |     Works by importing all commits reachable from a component's | 
 |     current head revision.  If those commits are rooted in an already | 
 |     imported commit, their content gets mixed with the content of the | 
 |     combined repo of that commit (new or modified files overwritten, | 
 |     removed files removed). | 
 |  | 
 |     The last commit is an artificial merge commit that merges all the | 
 |     updated components into the combined repository. | 
 |  | 
 |     The HEAD ref only gets updated at the very end. All intermediate work | 
 |     happens in a worktree which will get garbage collected by git eventually | 
 |     after a failure. | 
 |     ''' | 
 |     # Remember current HEAD and what we need to add to it. | 
 |     head = runcmd("git rev-parse HEAD").strip() | 
 |     additional_heads = {} | 
 |  | 
 |     # Track the mapping between original commit and commit in the | 
 |     # combined repo. We do not have to distinguish between components, | 
 |     # because commit hashes are different anyway. Often we can | 
 |     # skip find_revs() entirely (for example, when all new commits | 
 |     # are derived from the last imported revision). | 
 |     # | 
 |     # Using "head" (typically the merge commit) instead of the actual | 
 |     # commit for the component leads to a nicer history in the combined | 
 |     # repo. | 
 |     old2new_revs = {} | 
 |     for name in repos: | 
 |         repo = conf.repos[name] | 
 |         revision = repo['last_revision'] | 
 |         if revision: | 
 |             old2new_revs[revision] = head | 
 |  | 
 |     def add_p(parents): | 
 |         '''Insert -p before each entry.''' | 
 |         parameters = [] | 
 |         for p in parents: | 
 |             parameters.append('-p') | 
 |             parameters.append(p) | 
 |         return parameters | 
 |  | 
 |     # Do all intermediate work with a separate work dir and index, | 
 |     # chosen via env variables (can't use "git worktree", it is too | 
 |     # new). This is useful (no changes to current work tree unless the | 
 |     # update succeeds) and required (otherwise we end up temporarily | 
 |     # removing the combo-layer hooks that we currently use when | 
 |     # importing a new component). | 
 |     # | 
 |     # Not cleaned up after a failure at the moment. | 
 |     wdir = os.path.join(os.getcwd(), ".git", "combo-layer") | 
 |     windex = wdir + ".index" | 
 |     if os.path.isdir(wdir): | 
 |         shutil.rmtree(wdir) | 
 |     os.mkdir(wdir) | 
 |     wenv = copy.deepcopy(os.environ) | 
 |     wenv["GIT_WORK_TREE"] = wdir | 
 |     wenv["GIT_INDEX_FILE"] = windex | 
 |     # This one turned out to be needed in practice. | 
 |     wenv["GIT_OBJECT_DIRECTORY"] = os.path.join(os.getcwd(), ".git", "objects") | 
 |     wargs = {"destdir": wdir, "env": wenv} | 
 |  | 
 |     for name in repos: | 
 |         revision = revisions.get(name, None) | 
 |         repo = conf.repos[name] | 
 |         ldir = repo['local_repo_dir'] | 
 |         dest_dir = repo['dest_dir'] | 
 |         branch = repo.get('branch', "master") | 
 |         hook = repo.get('hook', None) | 
 |         largs = {"destdir": ldir, "env": None} | 
 |         file_include = repo.get('file_filter', '').split() | 
 |         file_include.sort() # make sure that short entries like '.' come first. | 
 |         file_exclude = repo.get('file_exclude', '').split() | 
 |  | 
 |         def include_file(file): | 
 |             if not file_include: | 
 |                 # No explicit filter set, include file. | 
 |                 return True | 
 |             for filter in file_include: | 
 |                 if filter == '.': | 
 |                     # Another special case: include current directory and thus all files. | 
 |                     return True | 
 |                 if os.path.commonprefix((filter, file)) == filter: | 
 |                     # Included in directory or direct file match. | 
 |                     return True | 
 |                 # Check for wildcard match *with* allowing * to match /, i.e. | 
 |                 # src/*.c does match src/foobar/*.c. That's not how it is done elsewhere | 
 |                 # when passing the filtering to "git archive", but it is unclear what | 
 |                 # the intended semantic is (the comment on file_exclude that "append a * wildcard | 
 |                 # at the end" to match the full content of a directories implies that | 
 |                 # slashes are indeed not special), so here we simply do what's easy to | 
 |                 # implement in Python. | 
 |                 logger.debug('fnmatch(%s, %s)' % (file, filter)) | 
 |                 if fnmatch.fnmatchcase(file, filter): | 
 |                     return True | 
 |             return False | 
 |  | 
 |         def exclude_file(file): | 
 |             for filter in file_exclude: | 
 |                 if fnmatch.fnmatchcase(file, filter): | 
 |                     return True | 
 |             return False | 
 |  | 
 |         def file_filter(files): | 
 |             '''Clean up file list so that only included files remain.''' | 
 |             index = 0 | 
 |             while index < len(files): | 
 |                 file = files[index] | 
 |                 if not include_file(file) or exclude_file(file): | 
 |                     del files[index] | 
 |                 else: | 
 |                     index += 1 | 
 |  | 
 |  | 
 |         # Generate the revision list. | 
 |         logger.info("Analyzing commits from %s..." % name) | 
 |         top_revision = revision or branch | 
 |         if not check_rev_branch(name, ldir, top_revision, branch): | 
 |             sys.exit(1) | 
 |  | 
 |         last_revision = repo['last_revision'] | 
 |         rev_list_args = "--full-history --sparse --topo-order --reverse" | 
 |         if not last_revision: | 
 |             logger.info("Warning: last_revision of component %s is not set, starting from the first commit" % name) | 
 |             rev_list_args = rev_list_args + ' ' + top_revision | 
 |         else: | 
 |             if not check_rev_branch(name, ldir, last_revision, branch): | 
 |                 sys.exit(1) | 
 |             rev_list_args = "%s %s..%s" % (rev_list_args, last_revision, top_revision) | 
 |  | 
 |             # By definition, the current HEAD contains the latest imported | 
 |             # commit of each component. We use that as initial mapping even | 
 |             # though the commits do not match exactly because | 
 |             # a) it always works (in contrast to find_revs, which relies on special | 
 |             #    commit messages) | 
 |             # b) it is faster than find_revs, which will only be called on demand | 
 |             #    and can be skipped entirely in most cases | 
 |             # c) last but not least, the combined history looks nicer when all | 
 |             #    new commits are rooted in the same merge commit | 
 |             old2new_revs[last_revision] = head | 
 |  | 
 |         # We care about all commits (--full-history and --sparse) and | 
 |         # we want reconstruct the topology and thus do not care | 
 |         # about ordering by time (--topo-order). We ask for the ones | 
 |         # we need to import first to be listed first (--reverse). | 
 |         revs = runcmd("git rev-list %s" % rev_list_args, **largs).split() | 
 |         logger.debug("To be imported: %s" % revs) | 
 |         # Now 'revs' contains all revisions reachable from the top revision. | 
 |         # All revisions derived from the 'last_revision' definitely are new, | 
 |         # whereas the others may or may not have been imported before. For | 
 |         # a linear history in the component, that second set will be empty. | 
 |         # To distinguish between them, we also get the shorter list | 
 |         # of revisions starting at the ancestor. | 
 |         if last_revision: | 
 |             ancestor_revs = runcmd("git rev-list --ancestry-path %s" % rev_list_args, **largs).split() | 
 |         else: | 
 |             ancestor_revs = [] | 
 |         logger.debug("Ancestors: %s" % ancestor_revs) | 
 |  | 
 |         # Now import each revision. | 
 |         logger.info("Importing commits from %s..." % name) | 
 |         def import_rev(rev): | 
 |             global scanned_revs | 
 |  | 
 |             # If it is part of the new commits, we definitely need | 
 |             # to import it. Otherwise we need to check, we might have | 
 |             # imported it before. If it was imported and we merely | 
 |             # fail to find it because commit messages did not track | 
 |             # the mapping, then we end up importing it again. So | 
 |             # combined repos using "updating with history" really should | 
 |             # enable the "From ... rev:" commit header modifications. | 
 |             if rev not in ancestor_revs and rev not in old2new_revs and not scanned_revs: | 
 |                 logger.debug("Revision %s triggers log analysis." % rev) | 
 |                 find_revs(old2new_revs, head) | 
 |                 scanned_revs = True | 
 |             new_rev = old2new_revs.get(rev, None) | 
 |             if new_rev: | 
 |                 return new_rev | 
 |  | 
 |             # If the commit is not in the original list of revisions | 
 |             # to be imported, then it must be a parent of one of those | 
 |             # commits and it was skipped during earlier imports or not | 
 |             # found. Importing such merge commits leads to very ugly | 
 |             # history (long cascade of merge commits which all point | 
 |             # to to older commits) when switching from "update via | 
 |             # patches" to "update with history". | 
 |             # | 
 |             # We can avoid importing merge commits if all non-merge commits | 
 |             # reachable from it were already imported. In that case we | 
 |             # can root the new commits in the current head revision. | 
 |             def is_imported(prev): | 
 |                 parents = runcmd("git show --no-patch --pretty=format:%P " + prev, **largs).split() | 
 |                 if len(parents) > 1: | 
 |                     for p in parents: | 
 |                         if not is_imported(p): | 
 |                             logger.debug("Must import %s because %s is not imported." % (rev, p)) | 
 |                             return False | 
 |                     return True | 
 |                 elif prev in old2new_revs: | 
 |                     return True | 
 |                 else: | 
 |                     logger.debug("Must import %s because %s is not imported." % (rev, prev)) | 
 |                     return False | 
 |             if rev not in revs and is_imported(rev): | 
 |                 old2new_revs[rev] = head | 
 |                 return head | 
 |  | 
 |             # Need to import rev. Collect some information about it. | 
 |             logger.debug("Importing %s" % rev) | 
 |             (parents, author_name, author_email, author_timestamp, body) = \ | 
 |                 runcmd("git show --no-patch --pretty=format:%P%x00%an%x00%ae%x00%at%x00%B " + rev, **largs).split(chr(0)) | 
 |             parents = parents.split() | 
 |             if parents: | 
 |                 # Arbitrarily pick the first parent as base. It may or may not have | 
 |                 # been imported before. For example, if the parent is a merge commit | 
 |                 # and previously the combined repository used patching as update | 
 |                 # method, then the actual merge commit parent never was imported. | 
 |                 # To cover this, We recursively import parents. | 
 |                 parent = parents[0] | 
 |                 new_parent = import_rev(parent) | 
 |                 # Clean index and working tree. TODO: can we combine this and the | 
 |                 # next into one command with less file IO? | 
 |                 # "git reset --hard" does not work, it changes HEAD of the parent | 
 |                 # repo, which we wanted to avoid. Probably need to keep | 
 |                 # track of the rev that corresponds to the index and use apply_commit(). | 
 |                 runcmd("git rm -q --ignore-unmatch -rf .", **wargs) | 
 |                 # Update index and working tree to match the parent. | 
 |                 runcmd("git checkout -q -f %s ." % new_parent, **wargs) | 
 |             else: | 
 |                 parent = None | 
 |                 # Clean index and working tree. | 
 |                 runcmd("git rm -q --ignore-unmatch -rf .", **wargs) | 
 |  | 
 |             # Modify index and working tree such that it mirrors the commit. | 
 |             apply_commit(parent, rev, largs, wargs, dest_dir, file_filter=file_filter) | 
 |  | 
 |             # Now commit. | 
 |             new_tree = runcmd("git write-tree", **wargs).strip() | 
 |             env = copy.deepcopy(wenv) | 
 |             env['GIT_AUTHOR_NAME'] = author_name | 
 |             env['GIT_AUTHOR_EMAIL'] = author_email | 
 |             env['GIT_AUTHOR_DATE'] = author_timestamp | 
 |             if hook: | 
 |                 # Need to turn the verbatim commit message into something resembling a patch header | 
 |                 # for the hook. | 
 |                 with tempfile.NamedTemporaryFile(delete=False) as patch: | 
 |                     patch.write('Subject: [PATCH] ') | 
 |                     patch.write(body) | 
 |                     patch.write('\n---\n') | 
 |                     patch.close() | 
 |                     runcmd([hook, patch.name, rev, name]) | 
 |                     with open(patch.name) as f: | 
 |                         body = f.read()[len('Subject: [PATCH] '):][:-len('\n---\n')] | 
 |  | 
 |             # We can skip non-merge commits that did not change any files. Those are typically | 
 |             # the result of file filtering, although they could also have been introduced | 
 |             # intentionally upstream, in which case we drop some information here. | 
 |             if len(parents) == 1: | 
 |                 parent_rev = import_rev(parents[0]) | 
 |                 old_tree = runcmd("git show -s --pretty=format:%T " + parent_rev, **wargs).strip() | 
 |                 commit = old_tree != new_tree | 
 |                 if not commit: | 
 |                     new_rev = parent_rev | 
 |             else: | 
 |                 commit = True | 
 |             if commit: | 
 |                 new_rev = runcmd("git commit-tree".split() + add_p([import_rev(p) for p in parents]) + | 
 |                                  ["-m", body, new_tree], | 
 |                                  env=env).strip() | 
 |             old2new_revs[rev] = new_rev | 
 |  | 
 |             return new_rev | 
 |  | 
 |         if revs: | 
 |             for rev in revs: | 
 |                 import_rev(rev) | 
 |             # Remember how to update our current head. New components get added, | 
 |             # updated components get the delta between current head and the updated component | 
 |             # applied. | 
 |             additional_heads[old2new_revs[revs[-1]]] = head if repo['last_revision'] else None | 
 |             repo['last_revision'] = revs[-1] | 
 |  | 
 |     # Now construct the final merge commit. We create the tree by | 
 |     # starting with the head and applying the changes from each | 
 |     # components imported head revision. | 
 |     if additional_heads: | 
 |         runcmd("git reset --hard", **wargs) | 
 |         for rev, base in additional_heads.items(): | 
 |             apply_commit(base, rev, wargs, wargs, None) | 
 |  | 
 |         # Commit with all component branches as parents as well as the previous head. | 
 |         logger.info("Writing final merge commit...") | 
 |         msg = conf_commit_msg(conf, components) | 
 |         new_tree = runcmd("git write-tree", **wargs).strip() | 
 |         new_rev = runcmd("git commit-tree".split() + | 
 |                          add_p([head] + list(additional_heads.keys())) + | 
 |                          ["-m", msg, new_tree], | 
 |                          **wargs).strip() | 
 |         # And done! This is the first time we change the HEAD in the actual work tree. | 
 |         runcmd("git reset --hard %s" % new_rev) | 
 |  | 
 |         # Update and stage the (potentially modified) | 
 |         # combo-layer.conf, but do not commit separately. | 
 |         for name in repos: | 
 |             repo = conf.repos[name] | 
 |             rev = repo['last_revision'] | 
 |             conf.update(name, "last_revision", rev) | 
 |         if commit_conf_file(conf, components, False): | 
 |             # Must augment the previous commit. | 
 |             runcmd("git commit --amend -C HEAD") | 
 |  | 
 |  | 
 | scanned_revs = False | 
 | def find_revs(old2new, head): | 
 |     '''Construct mapping from original commit hash to commit hash in | 
 |     combined repo by looking at the commit messages. Depends on the | 
 |     "From ... rev: ..." convention.''' | 
 |     logger.info("Analyzing log messages to find previously imported commits...") | 
 |     num_known = len(old2new) | 
 |     log = runcmd("git log --grep='From .* rev: [a-fA-F0-9][a-fA-F0-9]*' --pretty=format:%H%x00%B%x00 " + head).split(chr(0)) | 
 |     regex = re.compile(r'From .* rev: ([a-fA-F0-9]+)') | 
 |     for new_rev, body in zip(*[iter(log)]* 2): | 
 |         # Use the last one, in the unlikely case there are more than one. | 
 |         rev = regex.findall(body)[-1] | 
 |         if rev not in old2new: | 
 |             old2new[rev] = new_rev.strip() | 
 |     logger.info("Found %d additional commits, leading to: %s" % (len(old2new) - num_known, old2new)) | 
 |  | 
 |  | 
 | def apply_commit(parent, rev, largs, wargs, dest_dir, file_filter=None): | 
 |     '''Compare revision against parent, remove files deleted in the | 
 |     commit, re-write new or modified ones. Moves them into dest_dir. | 
 |     Optionally filters files. | 
 |     ''' | 
 |     if not dest_dir: | 
 |         dest_dir = "." | 
 |     # -r recurses into sub-directories, given is the full overview of | 
 |     # what changed.  We do not care about copy/edits or renames, so we | 
 |     # can disable those with --no-renames (but we still parse them, | 
 |     # because it was not clear from git documentation whether C and M | 
 |     # lines can still occur). | 
 |     logger.debug("Applying changes between %s and %s in %s" % (parent, rev, largs["destdir"])) | 
 |     delete = [] | 
 |     update = [] | 
 |     if parent: | 
 |         # Apply delta. | 
 |         changes = runcmd("git diff-tree --no-commit-id --no-renames --name-status -r --raw -z %s %s" % (parent, rev), **largs).split(chr(0)) | 
 |         for status, name in zip(*[iter(changes)]*2): | 
 |             if status[0] in "ACMRT": | 
 |                 update.append(name) | 
 |             elif status[0] in "D": | 
 |                 delete.append(name) | 
 |             else: | 
 |                 logger.error("Unknown status %s of file %s in revision %s" % (status, name, rev)) | 
 |                 sys.exit(1) | 
 |     else: | 
 |         # Copy all files. | 
 |         update.extend(runcmd("git ls-tree -r --name-only -z %s" % rev, **largs).split(chr(0))) | 
 |  | 
 |     # Include/exclude files as define in the component config. | 
 |     # Both updated and deleted file lists get filtered, because it might happen | 
 |     # that a file gets excluded, pulled from a different component, and then the | 
 |     # excluded file gets deleted. In that case we must keep the copy. | 
 |     if file_filter: | 
 |         file_filter(update) | 
 |         file_filter(delete) | 
 |  | 
 |     # We export into a tar archive here and extract with tar because it is simple (no | 
 |     # need to implement file and symlink writing ourselves) and gives us some degree | 
 |     # of parallel IO. The downside is that we have to pass the list of files via | 
 |     # command line parameters - hopefully there will never be too many at once. | 
 |     if update: | 
 |         target = os.path.join(wargs["destdir"], dest_dir) | 
 |         if not os.path.isdir(target): | 
 |             os.makedirs(target) | 
 |         quoted_target = pipes.quote(target) | 
 |         # os.sysconf('SC_ARG_MAX') is lying: running a command with | 
 |         # string length 629343 already failed with "Argument list too | 
 |         # long" although SC_ARG_MAX = 2097152. "man execve" explains | 
 |         # the limitations, but those are pretty complicated. So here | 
 |         # we just hard-code a fixed value which is more likely to work. | 
 |         max_cmdsize = 64 * 1024 | 
 |         while update: | 
 |             quoted_args = [] | 
 |             unquoted_args = [] | 
 |             cmdsize = 100 + len(quoted_target) | 
 |             while update: | 
 |                 quoted_next = pipes.quote(update[0]) | 
 |                 size_next = len(quoted_next) + len(dest_dir) + 1 | 
 |                 logger.debug('cmdline length %d + %d < %d?' % (cmdsize, size_next, os.sysconf('SC_ARG_MAX'))) | 
 |                 if cmdsize + size_next < max_cmdsize: | 
 |                     quoted_args.append(quoted_next) | 
 |                     unquoted_args.append(update.pop(0)) | 
 |                     cmdsize += size_next | 
 |                 else: | 
 |                     logger.debug('Breaking the cmdline at length %d' % cmdsize) | 
 |                     break | 
 |             logger.debug('Final cmdline length %d / %d' % (cmdsize, os.sysconf('SC_ARG_MAX'))) | 
 |             cmd = "git archive %s %s | tar -C %s -xf -" % (rev, ' '.join(quoted_args), quoted_target) | 
 |             logger.debug('First cmdline length %d' % len(cmd)) | 
 |             runcmd(cmd, **largs) | 
 |             cmd = "git add -f".split() + [os.path.join(dest_dir, x) for x in unquoted_args] | 
 |             logger.debug('Second cmdline length %d' % reduce(lambda x, y: x + len(y), cmd, 0)) | 
 |             runcmd(cmd, **wargs) | 
 |     if delete: | 
 |         for path in delete: | 
 |             if dest_dir: | 
 |                 path = os.path.join(dest_dir, path) | 
 |         runcmd("git rm -f --ignore-unmatch".split() + [os.path.join(dest_dir, x) for x in delete], **wargs) | 
 |  | 
 | def action_error(conf, args): | 
 |     logger.info("invalid action %s" % args[0]) | 
 |  | 
 | actions = { | 
 |     "init": action_init, | 
 |     "update": action_update, | 
 |     "pull": action_pull, | 
 |     "splitpatch": action_splitpatch, | 
 | } | 
 |  | 
 | def main(): | 
 |     parser = optparse.OptionParser( | 
 |         version = "Combo Layer Repo Tool version %s" % __version__, | 
 |         usage = """%prog [options] action | 
 |  | 
 | Create and update a combination layer repository from multiple component repositories. | 
 |  | 
 | Action: | 
 |   init                 initialise the combo layer repo | 
 |   update [components]  get patches from component repos and apply them to the combo repo | 
 |   pull [components]    just pull component repos only | 
 |   splitpatch [commit]  generate commit patch and split per component, default commit is HEAD""") | 
 |  | 
 |     parser.add_option("-c", "--conf", help = "specify the config file (conf/combo-layer.conf is the default).", | 
 |                action = "store", dest = "conffile", default = "conf/combo-layer.conf") | 
 |  | 
 |     parser.add_option("-i", "--interactive", help = "interactive mode, user can edit the patch list and patches", | 
 |                action = "store_true", dest = "interactive", default = False) | 
 |  | 
 |     parser.add_option("-D", "--debug", help = "output debug information", | 
 |                action = "store_true", dest = "debug", default = False) | 
 |  | 
 |     parser.add_option("-n", "--no-pull", help = "skip pulling component repos during update", | 
 |                action = "store_true", dest = "nopull", default = False) | 
 |  | 
 |     parser.add_option("--hard-reset", | 
 |                help = "instead of pull do fetch and hard-reset in component repos", | 
 |                action = "store_true", dest = "hard_reset", default = False) | 
 |  | 
 |     parser.add_option("-H", "--history", help = "import full history of components during init", | 
 |                       action = "store_true", default = False) | 
 |  | 
 |     options, args = parser.parse_args(sys.argv) | 
 |  | 
 |     # Dispatch to action handler | 
 |     if len(args) == 1: | 
 |         logger.error("No action specified, exiting") | 
 |         parser.print_help() | 
 |     elif args[1] not in actions: | 
 |         logger.error("Unsupported action %s, exiting\n" % (args[1])) | 
 |         parser.print_help() | 
 |     elif not os.path.exists(options.conffile): | 
 |         logger.error("No valid config file, exiting\n") | 
 |         parser.print_help() | 
 |     else: | 
 |         if options.debug: | 
 |             logger.setLevel(logging.DEBUG) | 
 |         confdata = Configuration(options) | 
 |         initmode = (args[1] == 'init') | 
 |         confdata.sanity_check(initmode) | 
 |         actions.get(args[1], action_error)(confdata, args[1:]) | 
 |  | 
 | if __name__ == "__main__": | 
 |     try: | 
 |         ret = main() | 
 |     except Exception: | 
 |         ret = 1 | 
 |         import traceback | 
 |         traceback.print_exc() | 
 |     sys.exit(ret) |