forked from brl/citadel
1377 lines
60 KiB
Plaintext
1377 lines
60 KiB
Plaintext
|
#!/usr/bin/env python3
|
||
|
# ex:ts=4:sw=4:sts=4:et
|
||
|
# -*- tab-width: 4; c-basic-offset: 4; indent-tabs-mode: nil -*-
|
||
|
#
|
||
|
# Copyright 2011 Intel Corporation
|
||
|
# Authored-by: Yu Ke <ke.yu@intel.com>
|
||
|
# Paul Eggleton <paul.eggleton@intel.com>
|
||
|
# Richard Purdie <richard.purdie@intel.com>
|
||
|
#
|
||
|
# This program is free software; you can redistribute it and/or modify
|
||
|
# it under the terms of the GNU General Public License version 2 as
|
||
|
# published by the Free Software Foundation.
|
||
|
#
|
||
|
# This program is distributed in the hope that it will be useful,
|
||
|
# but WITHOUT ANY WARRANTY; without even the implied warranty of
|
||
|
# MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
|
||
|
# GNU General Public License for more details.
|
||
|
#
|
||
|
# You should have received a copy of the GNU General Public License along
|
||
|
# with this program; if not, write to the Free Software Foundation, Inc.,
|
||
|
# 51 Franklin Street, Fifth Floor, Boston, MA 02110-1301 USA.
|
||
|
|
||
|
import fnmatch
|
||
|
import os, sys
|
||
|
import optparse
|
||
|
import logging
|
||
|
import subprocess
|
||
|
import tempfile
|
||
|
import configparser
|
||
|
import re
|
||
|
import copy
|
||
|
import pipes
|
||
|
import shutil
|
||
|
from collections import OrderedDict
|
||
|
from string import Template
|
||
|
from functools import reduce
|
||
|
|
||
|
__version__ = "0.2.1"
|
||
|
|
||
|
def logger_create():
|
||
|
logger = logging.getLogger("")
|
||
|
loggerhandler = logging.StreamHandler()
|
||
|
loggerhandler.setFormatter(logging.Formatter("[%(asctime)s] %(message)s","%H:%M:%S"))
|
||
|
logger.addHandler(loggerhandler)
|
||
|
logger.setLevel(logging.INFO)
|
||
|
return logger
|
||
|
|
||
|
logger = logger_create()
|
||
|
|
||
|
def get_current_branch(repodir=None):
|
||
|
try:
|
||
|
if not os.path.exists(os.path.join(repodir if repodir else '', ".git")):
|
||
|
# Repo not created yet (i.e. during init) so just assume master
|
||
|
return "master"
|
||
|
branchname = runcmd("git symbolic-ref HEAD 2>/dev/null", repodir).strip()
|
||
|
if branchname.startswith("refs/heads/"):
|
||
|
branchname = branchname[11:]
|
||
|
return branchname
|
||
|
except subprocess.CalledProcessError:
|
||
|
return ""
|
||
|
|
||
|
class Configuration(object):
|
||
|
"""
|
||
|
Manages the configuration
|
||
|
|
||
|
For an example config file, see combo-layer.conf.example
|
||
|
|
||
|
"""
|
||
|
def __init__(self, options):
|
||
|
for key, val in options.__dict__.items():
|
||
|
setattr(self, key, val)
|
||
|
|
||
|
def readsection(parser, section, repo):
|
||
|
for (name, value) in parser.items(section):
|
||
|
if value.startswith("@"):
|
||
|
self.repos[repo][name] = eval(value.strip("@"))
|
||
|
else:
|
||
|
# Apply special type transformations for some properties.
|
||
|
# Type matches the RawConfigParser.get*() methods.
|
||
|
types = {'signoff': 'boolean', 'update': 'boolean', 'history': 'boolean'}
|
||
|
if name in types:
|
||
|
value = getattr(parser, 'get' + types[name])(section, name)
|
||
|
self.repos[repo][name] = value
|
||
|
|
||
|
def readglobalsection(parser, section):
|
||
|
for (name, value) in parser.items(section):
|
||
|
if name == "commit_msg":
|
||
|
self.commit_msg_template = value
|
||
|
|
||
|
logger.debug("Loading config file %s" % self.conffile)
|
||
|
self.parser = configparser.ConfigParser()
|
||
|
with open(self.conffile) as f:
|
||
|
self.parser.readfp(f)
|
||
|
|
||
|
# initialize default values
|
||
|
self.commit_msg_template = "Automatic commit to update last_revision"
|
||
|
|
||
|
self.repos = {}
|
||
|
for repo in self.parser.sections():
|
||
|
if repo == "combo-layer-settings":
|
||
|
# special handling for global settings
|
||
|
readglobalsection(self.parser, repo)
|
||
|
else:
|
||
|
self.repos[repo] = {}
|
||
|
readsection(self.parser, repo, repo)
|
||
|
|
||
|
# Load local configuration, if available
|
||
|
self.localconffile = None
|
||
|
self.localparser = None
|
||
|
self.combobranch = None
|
||
|
if self.conffile.endswith('.conf'):
|
||
|
lcfile = self.conffile.replace('.conf', '-local.conf')
|
||
|
if os.path.exists(lcfile):
|
||
|
# Read combo layer branch
|
||
|
self.combobranch = get_current_branch()
|
||
|
logger.debug("Combo layer branch is %s" % self.combobranch)
|
||
|
|
||
|
self.localconffile = lcfile
|
||
|
logger.debug("Loading local config file %s" % self.localconffile)
|
||
|
self.localparser = configparser.ConfigParser()
|
||
|
with open(self.localconffile) as f:
|
||
|
self.localparser.readfp(f)
|
||
|
|
||
|
for section in self.localparser.sections():
|
||
|
if '|' in section:
|
||
|
sectionvals = section.split('|')
|
||
|
repo = sectionvals[0]
|
||
|
if sectionvals[1] != self.combobranch:
|
||
|
continue
|
||
|
else:
|
||
|
repo = section
|
||
|
if repo in self.repos:
|
||
|
readsection(self.localparser, section, repo)
|
||
|
|
||
|
def update(self, repo, option, value, initmode=False):
|
||
|
# If the main config has the option already, that is what we
|
||
|
# are expected to modify.
|
||
|
if self.localparser and not self.parser.has_option(repo, option):
|
||
|
parser = self.localparser
|
||
|
section = "%s|%s" % (repo, self.combobranch)
|
||
|
conffile = self.localconffile
|
||
|
if initmode and not parser.has_section(section):
|
||
|
parser.add_section(section)
|
||
|
else:
|
||
|
parser = self.parser
|
||
|
section = repo
|
||
|
conffile = self.conffile
|
||
|
parser.set(section, option, value)
|
||
|
with open(conffile, "w") as f:
|
||
|
parser.write(f)
|
||
|
self.repos[repo][option] = value
|
||
|
|
||
|
def sanity_check(self, initmode=False):
|
||
|
required_options=["src_uri", "local_repo_dir", "dest_dir", "last_revision"]
|
||
|
if initmode:
|
||
|
required_options.remove("last_revision")
|
||
|
msg = ""
|
||
|
missing_options = []
|
||
|
for name in self.repos:
|
||
|
for option in required_options:
|
||
|
if option not in self.repos[name]:
|
||
|
msg = "%s\nOption %s is not defined for component %s" %(msg, option, name)
|
||
|
missing_options.append(option)
|
||
|
# Sanitize dest_dir so that we do not have to deal with edge cases
|
||
|
# (unset, empty string, double slashes) in the rest of the code.
|
||
|
# It not being set will still be flagged as error because it is
|
||
|
# listed as required option above; that could be changed now.
|
||
|
dest_dir = os.path.normpath(self.repos[name].get("dest_dir", "."))
|
||
|
self.repos[name]["dest_dir"] = "." if not dest_dir else dest_dir
|
||
|
if msg != "":
|
||
|
logger.error("configuration file %s has the following error: %s" % (self.conffile,msg))
|
||
|
if self.localconffile and 'last_revision' in missing_options:
|
||
|
logger.error("local configuration file %s may be missing configuration for combo branch %s" % (self.localconffile, self.combobranch))
|
||
|
sys.exit(1)
|
||
|
|
||
|
# filterdiff is required by action_splitpatch, so check its availability
|
||
|
if subprocess.call("which filterdiff > /dev/null 2>&1", shell=True) != 0:
|
||
|
logger.error("ERROR: patchutils package is missing, please install it (e.g. # apt-get install patchutils)")
|
||
|
sys.exit(1)
|
||
|
|
||
|
def runcmd(cmd,destdir=None,printerr=True,out=None,env=None):
|
||
|
"""
|
||
|
execute command, raise CalledProcessError if fail
|
||
|
return output if succeed
|
||
|
"""
|
||
|
logger.debug("run cmd '%s' in %s" % (cmd, os.getcwd() if destdir is None else destdir))
|
||
|
if not out:
|
||
|
out = tempfile.TemporaryFile()
|
||
|
err = out
|
||
|
else:
|
||
|
err = tempfile.TemporaryFile()
|
||
|
try:
|
||
|
subprocess.check_call(cmd, stdout=out, stderr=err, cwd=destdir, shell=isinstance(cmd, str), env=env or os.environ)
|
||
|
except subprocess.CalledProcessError as e:
|
||
|
err.seek(0)
|
||
|
if printerr:
|
||
|
logger.error("%s" % err.read())
|
||
|
raise e
|
||
|
|
||
|
err.seek(0)
|
||
|
output = err.read().decode('utf-8')
|
||
|
logger.debug("output: %s" % output.replace(chr(0), '\\0'))
|
||
|
return output
|
||
|
|
||
|
def action_init(conf, args):
|
||
|
"""
|
||
|
Clone component repositories
|
||
|
Check git is initialised; if not, copy initial data from component repos
|
||
|
"""
|
||
|
for name in conf.repos:
|
||
|
ldir = conf.repos[name]['local_repo_dir']
|
||
|
if not os.path.exists(ldir):
|
||
|
logger.info("cloning %s to %s" %(conf.repos[name]['src_uri'], ldir))
|
||
|
subprocess.check_call("git clone %s %s" % (conf.repos[name]['src_uri'], ldir), shell=True)
|
||
|
if not os.path.exists(".git"):
|
||
|
runcmd("git init")
|
||
|
if conf.history:
|
||
|
# Need a common ref for all trees.
|
||
|
runcmd('git commit -m "initial empty commit" --allow-empty')
|
||
|
startrev = runcmd('git rev-parse master').strip()
|
||
|
|
||
|
for name in conf.repos:
|
||
|
repo = conf.repos[name]
|
||
|
ldir = repo['local_repo_dir']
|
||
|
branch = repo.get('branch', "master")
|
||
|
lastrev = repo.get('last_revision', None)
|
||
|
if lastrev and lastrev != "HEAD":
|
||
|
initialrev = lastrev
|
||
|
if branch:
|
||
|
if not check_rev_branch(name, ldir, lastrev, branch):
|
||
|
sys.exit(1)
|
||
|
logger.info("Copying data from %s at specified revision %s..." % (name, lastrev))
|
||
|
else:
|
||
|
lastrev = None
|
||
|
initialrev = branch
|
||
|
logger.info("Copying data from %s..." % name)
|
||
|
# Sanity check initialrev and turn it into hash (required for copying history,
|
||
|
# because resolving a name ref only works in the component repo).
|
||
|
rev = runcmd('git rev-parse %s' % initialrev, ldir).strip()
|
||
|
if rev != initialrev:
|
||
|
try:
|
||
|
refs = runcmd('git show-ref -s %s' % initialrev, ldir).split('\n')
|
||
|
if len(set(refs)) > 1:
|
||
|
# Happens for example when configured to track
|
||
|
# "master" and there is a refs/heads/master. The
|
||
|
# traditional behavior from "git archive" (preserved
|
||
|
# here) it to choose the first one. This might not be
|
||
|
# intended, so at least warn about it.
|
||
|
logger.warn("%s: initial revision '%s' not unique, picking result of rev-parse = %s" %
|
||
|
(name, initialrev, refs[0]))
|
||
|
initialrev = rev
|
||
|
except:
|
||
|
# show-ref fails for hashes. Skip the sanity warning in that case.
|
||
|
pass
|
||
|
initialrev = rev
|
||
|
dest_dir = repo['dest_dir']
|
||
|
if dest_dir != ".":
|
||
|
extract_dir = os.path.join(os.getcwd(), dest_dir)
|
||
|
if not os.path.exists(extract_dir):
|
||
|
os.makedirs(extract_dir)
|
||
|
else:
|
||
|
extract_dir = os.getcwd()
|
||
|
file_filter = repo.get('file_filter', "")
|
||
|
exclude_patterns = repo.get('file_exclude', '').split()
|
||
|
def copy_selected_files(initialrev, extract_dir, file_filter, exclude_patterns, ldir,
|
||
|
subdir=""):
|
||
|
# When working inside a filtered branch which had the
|
||
|
# files already moved, we need to prepend the
|
||
|
# subdirectory to all filters, otherwise they would
|
||
|
# not match.
|
||
|
if subdir == '.':
|
||
|
subdir = ''
|
||
|
elif subdir:
|
||
|
subdir = os.path.normpath(subdir)
|
||
|
file_filter = ' '.join([subdir + '/' + x for x in file_filter.split()])
|
||
|
exclude_patterns = [subdir + '/' + x for x in exclude_patterns]
|
||
|
# To handle both cases, we cd into the target
|
||
|
# directory and optionally tell tar to strip the path
|
||
|
# prefix when the files were already moved.
|
||
|
subdir_components = len(subdir.split(os.path.sep)) if subdir else 0
|
||
|
strip=('--strip-components=%d' % subdir_components) if subdir else ''
|
||
|
# TODO: file_filter wild cards do not work (and haven't worked before either), because
|
||
|
# a) GNU tar requires a --wildcards parameter before turning on wild card matching.
|
||
|
# b) The semantic is not as intendend (src/*.c also matches src/foo/bar.c,
|
||
|
# in contrast to the other use of file_filter as parameter of "git archive"
|
||
|
# where it only matches .c files directly in src).
|
||
|
files = runcmd("git archive %s %s | tar -x -v %s -C %s %s" %
|
||
|
(initialrev, subdir,
|
||
|
strip, extract_dir, file_filter),
|
||
|
ldir)
|
||
|
if exclude_patterns:
|
||
|
# Implement file removal by letting tar create the
|
||
|
# file and then deleting it in the file system
|
||
|
# again. Uses the list of files created by tar (easier
|
||
|
# than walking the tree).
|
||
|
for file in files.split('\n'):
|
||
|
if file.endswith(os.path.sep):
|
||
|
continue
|
||
|
for pattern in exclude_patterns:
|
||
|
if fnmatch.fnmatch(file, pattern):
|
||
|
os.unlink(os.path.join(*([extract_dir] + ['..'] * subdir_components + [file])))
|
||
|
break
|
||
|
|
||
|
if not conf.history:
|
||
|
copy_selected_files(initialrev, extract_dir, file_filter, exclude_patterns, ldir)
|
||
|
else:
|
||
|
# First fetch remote history into local repository.
|
||
|
# We need a ref for that, so ensure that there is one.
|
||
|
refname = "combo-layer-init-%s" % name
|
||
|
runcmd("git branch -f %s %s" % (refname, initialrev), ldir)
|
||
|
runcmd("git fetch %s %s" % (ldir, refname))
|
||
|
runcmd("git branch -D %s" % refname, ldir)
|
||
|
# Make that the head revision.
|
||
|
runcmd("git checkout -b %s %s" % (name, initialrev))
|
||
|
# Optional: cut the history by replacing the given
|
||
|
# start point(s) with commits providing the same
|
||
|
# content (aka tree), but with commit information that
|
||
|
# makes it clear that this is an artifically created
|
||
|
# commit and nothing the original authors had anything
|
||
|
# to do with.
|
||
|
since_rev = repo.get('since_revision', '')
|
||
|
if since_rev:
|
||
|
committer = runcmd('git var GIT_AUTHOR_IDENT').strip()
|
||
|
# Same time stamp, no name.
|
||
|
author = re.sub('.* (\d+ [+-]\d+)', r'unknown <unknown> \1', committer)
|
||
|
logger.info('author %s' % author)
|
||
|
for rev in since_rev.split():
|
||
|
# Resolve in component repo...
|
||
|
rev = runcmd('git log --oneline --no-abbrev-commit -n1 %s' % rev, ldir).split()[0]
|
||
|
# ... and then get the tree in current
|
||
|
# one. The commit should be in both repos with
|
||
|
# the same tree, but better check here.
|
||
|
tree = runcmd('git show -s --pretty=format:%%T %s' % rev).strip()
|
||
|
with tempfile.NamedTemporaryFile(mode='wt') as editor:
|
||
|
editor.write('''cat >$1 <<EOF
|
||
|
tree %s
|
||
|
author %s
|
||
|
committer %s
|
||
|
|
||
|
%s: squashed import of component
|
||
|
|
||
|
This commit copies the entire set of files as found in
|
||
|
%s %s
|
||
|
|
||
|
For more information about previous commits, see the
|
||
|
upstream repository.
|
||
|
|
||
|
Commit created by combo-layer.
|
||
|
EOF
|
||
|
''' % (tree, author, committer, name, name, since_rev))
|
||
|
editor.flush()
|
||
|
os.environ['GIT_EDITOR'] = 'sh %s' % editor.name
|
||
|
runcmd('git replace --edit %s' % rev)
|
||
|
|
||
|
# Optional: rewrite history to change commit messages or to move files.
|
||
|
if 'hook' in repo or dest_dir != ".":
|
||
|
filter_branch = ['git', 'filter-branch', '--force']
|
||
|
with tempfile.NamedTemporaryFile(mode='wt') as hookwrapper:
|
||
|
if 'hook' in repo:
|
||
|
# Create a shell script wrapper around the original hook that
|
||
|
# can be used by git filter-branch. Hook may or may not have
|
||
|
# an absolute path.
|
||
|
hook = repo['hook']
|
||
|
hook = os.path.join(os.path.dirname(conf.conffile), '..', hook)
|
||
|
# The wrappers turns the commit message
|
||
|
# from stdin into a fake patch header.
|
||
|
# This is good enough for changing Subject
|
||
|
# and commit msg body with normal
|
||
|
# combo-layer hooks.
|
||
|
hookwrapper.write('''set -e
|
||
|
tmpname=$(mktemp)
|
||
|
trap "rm $tmpname" EXIT
|
||
|
echo -n 'Subject: [PATCH] ' >>$tmpname
|
||
|
cat >>$tmpname
|
||
|
if ! [ $(tail -c 1 $tmpname | od -A n -t x1) == '0a' ]; then
|
||
|
echo >>$tmpname
|
||
|
fi
|
||
|
echo '---' >>$tmpname
|
||
|
%s $tmpname $GIT_COMMIT %s
|
||
|
tail -c +18 $tmpname | head -c -4
|
||
|
''' % (hook, name))
|
||
|
hookwrapper.flush()
|
||
|
filter_branch.extend(['--msg-filter', 'bash %s' % hookwrapper.name])
|
||
|
if dest_dir != ".":
|
||
|
parent = os.path.dirname(dest_dir)
|
||
|
if not parent:
|
||
|
parent = '.'
|
||
|
# May run outside of the current directory, so do not assume that .git exists.
|
||
|
filter_branch.extend(['--tree-filter', 'mkdir -p .git/tmptree && find . -mindepth 1 -maxdepth 1 ! -name .git -print0 | xargs -0 -I SOURCE mv SOURCE .git/tmptree && mkdir -p %s && mv .git/tmptree %s' % (parent, dest_dir)])
|
||
|
filter_branch.append('HEAD')
|
||
|
runcmd(filter_branch)
|
||
|
runcmd('git update-ref -d refs/original/refs/heads/%s' % name)
|
||
|
repo['rewritten_revision'] = runcmd('git rev-parse HEAD').strip()
|
||
|
repo['stripped_revision'] = repo['rewritten_revision']
|
||
|
# Optional filter files: remove everything and re-populate using the normal filtering code.
|
||
|
# Override any potential .gitignore.
|
||
|
if file_filter or exclude_patterns:
|
||
|
runcmd('git rm -rf .')
|
||
|
if not os.path.exists(extract_dir):
|
||
|
os.makedirs(extract_dir)
|
||
|
copy_selected_files('HEAD', extract_dir, file_filter, exclude_patterns, '.',
|
||
|
subdir=dest_dir)
|
||
|
runcmd('git add --all --force .')
|
||
|
if runcmd('git status --porcelain'):
|
||
|
# Something to commit.
|
||
|
runcmd(['git', 'commit', '-m',
|
||
|
'''%s: select file subset
|
||
|
|
||
|
Files from the component repository were chosen based on
|
||
|
the following filters:
|
||
|
file_filter = %s
|
||
|
file_exclude = %s''' % (name, file_filter or '<empty>', repo.get('file_exclude', '<empty>'))])
|
||
|
repo['stripped_revision'] = runcmd('git rev-parse HEAD').strip()
|
||
|
|
||
|
if not lastrev:
|
||
|
lastrev = runcmd('git rev-parse %s' % initialrev, ldir).strip()
|
||
|
conf.update(name, "last_revision", lastrev, initmode=True)
|
||
|
|
||
|
if not conf.history:
|
||
|
runcmd("git add .")
|
||
|
else:
|
||
|
# Create Octopus merge commit according to http://stackoverflow.com/questions/10874149/git-octopus-merge-with-unrelated-repositoies
|
||
|
runcmd('git checkout master')
|
||
|
merge = ['git', 'merge', '--no-commit']
|
||
|
for name in conf.repos:
|
||
|
repo = conf.repos[name]
|
||
|
# Use branch created earlier.
|
||
|
merge.append(name)
|
||
|
# Root all commits which have no parent in the common
|
||
|
# ancestor in the new repository.
|
||
|
for start in runcmd('git log --pretty=format:%%H --max-parents=0 %s --' % name).split('\n'):
|
||
|
runcmd('git replace --graft %s %s' % (start, startrev))
|
||
|
try:
|
||
|
runcmd(merge)
|
||
|
except Exception as error:
|
||
|
logger.info('''Merging component repository history failed, perhaps because of merge conflicts.
|
||
|
It may be possible to commit anyway after resolving these conflicts.
|
||
|
|
||
|
%s''' % error)
|
||
|
# Create MERGE_HEAD and MERGE_MSG. "git merge" itself
|
||
|
# does not create MERGE_HEAD in case of a (harmless) failure,
|
||
|
# and we want certain auto-generated information in the
|
||
|
# commit message for future reference and/or automation.
|
||
|
with open('.git/MERGE_HEAD', 'w') as head:
|
||
|
with open('.git/MERGE_MSG', 'w') as msg:
|
||
|
msg.write('repo: initial import of components\n\n')
|
||
|
# head.write('%s\n' % startrev)
|
||
|
for name in conf.repos:
|
||
|
repo = conf.repos[name]
|
||
|
# <upstream ref> <rewritten ref> <rewritten + files removed>
|
||
|
msg.write('combo-layer-%s: %s %s %s\n' % (name,
|
||
|
repo['last_revision'],
|
||
|
repo['rewritten_revision'],
|
||
|
repo['stripped_revision']))
|
||
|
rev = runcmd('git rev-parse %s' % name).strip()
|
||
|
head.write('%s\n' % rev)
|
||
|
|
||
|
if conf.localconffile:
|
||
|
localadded = True
|
||
|
try:
|
||
|
runcmd("git rm --cached %s" % conf.localconffile, printerr=False)
|
||
|
except subprocess.CalledProcessError:
|
||
|
localadded = False
|
||
|
if localadded:
|
||
|
localrelpath = os.path.relpath(conf.localconffile)
|
||
|
runcmd("grep -q %s .gitignore || echo %s >> .gitignore" % (localrelpath, localrelpath))
|
||
|
runcmd("git add .gitignore")
|
||
|
logger.info("Added local configuration file %s to .gitignore", localrelpath)
|
||
|
logger.info("Initial combo layer repository data has been created; please make any changes if desired and then use 'git commit' to make the initial commit.")
|
||
|
else:
|
||
|
logger.info("Repository already initialised, nothing to do.")
|
||
|
|
||
|
|
||
|
def check_repo_clean(repodir):
|
||
|
"""
|
||
|
check if the repo is clean
|
||
|
exit if repo is dirty
|
||
|
"""
|
||
|
output=runcmd("git status --porcelain", repodir)
|
||
|
r = re.compile('\?\? patch-.*/')
|
||
|
dirtyout = [item for item in output.splitlines() if not r.match(item)]
|
||
|
if dirtyout:
|
||
|
logger.error("git repo %s is dirty, please fix it first", repodir)
|
||
|
sys.exit(1)
|
||
|
|
||
|
def check_patch(patchfile):
|
||
|
f = open(patchfile, 'rb')
|
||
|
ln = f.readline()
|
||
|
of = None
|
||
|
in_patch = False
|
||
|
beyond_msg = False
|
||
|
pre_buf = b''
|
||
|
while ln:
|
||
|
if not beyond_msg:
|
||
|
if ln == b'---\n':
|
||
|
if not of:
|
||
|
break
|
||
|
in_patch = False
|
||
|
beyond_msg = True
|
||
|
elif ln.startswith(b'--- '):
|
||
|
# We have a diff in the commit message
|
||
|
in_patch = True
|
||
|
if not of:
|
||
|
print('WARNING: %s contains a diff in its commit message, indenting to avoid failure during apply' % patchfile)
|
||
|
of = open(patchfile + '.tmp', 'wb')
|
||
|
of.write(pre_buf)
|
||
|
pre_buf = b''
|
||
|
elif in_patch and not ln[0] in b'+-@ \n\r':
|
||
|
in_patch = False
|
||
|
if of:
|
||
|
if in_patch:
|
||
|
of.write(b' ' + ln)
|
||
|
else:
|
||
|
of.write(ln)
|
||
|
else:
|
||
|
pre_buf += ln
|
||
|
ln = f.readline()
|
||
|
f.close()
|
||
|
if of:
|
||
|
of.close()
|
||
|
os.rename(patchfile + '.tmp', patchfile)
|
||
|
|
||
|
def drop_to_shell(workdir=None):
|
||
|
if not sys.stdin.isatty():
|
||
|
print("Not a TTY so can't drop to shell for resolution, exiting.")
|
||
|
return False
|
||
|
|
||
|
shell = os.environ.get('SHELL', 'bash')
|
||
|
print('Dropping to shell "%s"\n' \
|
||
|
'When you are finished, run the following to continue:\n' \
|
||
|
' exit -- continue to apply the patches\n' \
|
||
|
' exit 1 -- abort\n' % shell);
|
||
|
ret = subprocess.call([shell], cwd=workdir)
|
||
|
if ret != 0:
|
||
|
print("Aborting")
|
||
|
return False
|
||
|
else:
|
||
|
return True
|
||
|
|
||
|
def check_rev_branch(component, repodir, rev, branch):
|
||
|
try:
|
||
|
actualbranch = runcmd("git branch --contains %s" % rev, repodir, printerr=False)
|
||
|
except subprocess.CalledProcessError as e:
|
||
|
if e.returncode == 129:
|
||
|
actualbranch = ""
|
||
|
else:
|
||
|
raise
|
||
|
|
||
|
if not actualbranch:
|
||
|
logger.error("%s: specified revision %s is invalid!" % (component, rev))
|
||
|
return False
|
||
|
|
||
|
branches = []
|
||
|
branchlist = actualbranch.split("\n")
|
||
|
for b in branchlist:
|
||
|
branches.append(b.strip().split(' ')[-1])
|
||
|
|
||
|
if branch not in branches:
|
||
|
logger.error("%s: specified revision %s is not on specified branch %s!" % (component, rev, branch))
|
||
|
return False
|
||
|
return True
|
||
|
|
||
|
def get_repos(conf, repo_names):
|
||
|
repos = []
|
||
|
for name in repo_names:
|
||
|
if name.startswith('-'):
|
||
|
break
|
||
|
else:
|
||
|
repos.append(name)
|
||
|
for repo in repos:
|
||
|
if not repo in conf.repos:
|
||
|
logger.error("Specified component '%s' not found in configuration" % repo)
|
||
|
sys.exit(1)
|
||
|
|
||
|
if not repos:
|
||
|
repos = [ repo for repo in conf.repos if conf.repos[repo].get("update", True) ]
|
||
|
|
||
|
return repos
|
||
|
|
||
|
def action_pull(conf, args):
|
||
|
"""
|
||
|
update the component repos only
|
||
|
"""
|
||
|
repos = get_repos(conf, args[1:])
|
||
|
|
||
|
# make sure all repos are clean
|
||
|
for name in repos:
|
||
|
check_repo_clean(conf.repos[name]['local_repo_dir'])
|
||
|
|
||
|
for name in repos:
|
||
|
repo = conf.repos[name]
|
||
|
ldir = repo['local_repo_dir']
|
||
|
branch = repo.get('branch', "master")
|
||
|
logger.info("update branch %s of component repo %s in %s ..." % (branch, name, ldir))
|
||
|
if not conf.hard_reset:
|
||
|
# Try to pull only the configured branch. Beware that this may fail
|
||
|
# when the branch is currently unknown (for example, after reconfiguring
|
||
|
# combo-layer). In that case we need to fetch everything and try the check out
|
||
|
# and pull again.
|
||
|
try:
|
||
|
runcmd("git checkout %s" % branch, ldir, printerr=False)
|
||
|
except subprocess.CalledProcessError:
|
||
|
output=runcmd("git fetch", ldir)
|
||
|
logger.info(output)
|
||
|
runcmd("git checkout %s" % branch, ldir)
|
||
|
runcmd("git pull --ff-only", ldir)
|
||
|
else:
|
||
|
output=runcmd("git pull --ff-only", ldir)
|
||
|
logger.info(output)
|
||
|
else:
|
||
|
output=runcmd("git fetch", ldir)
|
||
|
logger.info(output)
|
||
|
runcmd("git checkout %s" % branch, ldir)
|
||
|
runcmd("git reset --hard FETCH_HEAD", ldir)
|
||
|
|
||
|
def action_update(conf, args):
|
||
|
"""
|
||
|
update the component repos
|
||
|
either:
|
||
|
generate the patch list
|
||
|
apply the generated patches
|
||
|
or:
|
||
|
re-creates the entire component history and merges them
|
||
|
into the current branch with a merge commit
|
||
|
"""
|
||
|
components = [arg.split(':')[0] for arg in args[1:]]
|
||
|
revisions = {}
|
||
|
for arg in args[1:]:
|
||
|
if ':' in arg:
|
||
|
a = arg.split(':', 1)
|
||
|
revisions[a[0]] = a[1]
|
||
|
repos = get_repos(conf, components)
|
||
|
|
||
|
# make sure combo repo is clean
|
||
|
check_repo_clean(os.getcwd())
|
||
|
|
||
|
# Check whether we keep the component histories. Must be
|
||
|
# set either via --history command line parameter or consistently
|
||
|
# in combo-layer.conf. Mixing modes is (currently, and probably
|
||
|
# permanently because it would be complicated) not supported.
|
||
|
if conf.history:
|
||
|
history = True
|
||
|
else:
|
||
|
history = None
|
||
|
for name in repos:
|
||
|
repo = conf.repos[name]
|
||
|
repo_history = repo.get('history', False)
|
||
|
if history is None:
|
||
|
history = repo_history
|
||
|
elif history != repo_history:
|
||
|
logger.error("'history' property is set inconsistently")
|
||
|
sys.exit(1)
|
||
|
|
||
|
# Step 1: update the component repos
|
||
|
if conf.nopull:
|
||
|
logger.info("Skipping pull (-n)")
|
||
|
else:
|
||
|
action_pull(conf, ['arg0'] + components)
|
||
|
|
||
|
if history:
|
||
|
update_with_history(conf, components, revisions, repos)
|
||
|
else:
|
||
|
update_with_patches(conf, components, revisions, repos)
|
||
|
|
||
|
def update_with_patches(conf, components, revisions, repos):
|
||
|
import uuid
|
||
|
patch_dir = "patch-%s" % uuid.uuid4()
|
||
|
if not os.path.exists(patch_dir):
|
||
|
os.mkdir(patch_dir)
|
||
|
|
||
|
for name in repos:
|
||
|
revision = revisions.get(name, None)
|
||
|
repo = conf.repos[name]
|
||
|
ldir = repo['local_repo_dir']
|
||
|
dest_dir = repo['dest_dir']
|
||
|
branch = repo.get('branch', "master")
|
||
|
repo_patch_dir = os.path.join(os.getcwd(), patch_dir, name)
|
||
|
|
||
|
# Step 2: generate the patch list and store to patch dir
|
||
|
logger.info("Generating patches from %s..." % name)
|
||
|
top_revision = revision or branch
|
||
|
if not check_rev_branch(name, ldir, top_revision, branch):
|
||
|
sys.exit(1)
|
||
|
if dest_dir != ".":
|
||
|
prefix = "--src-prefix=a/%s/ --dst-prefix=b/%s/" % (dest_dir, dest_dir)
|
||
|
else:
|
||
|
prefix = ""
|
||
|
if repo['last_revision'] == "":
|
||
|
logger.info("Warning: last_revision of component %s is not set, starting from the first commit" % name)
|
||
|
patch_cmd_range = "--root %s" % top_revision
|
||
|
rev_cmd_range = top_revision
|
||
|
else:
|
||
|
if not check_rev_branch(name, ldir, repo['last_revision'], branch):
|
||
|
sys.exit(1)
|
||
|
patch_cmd_range = "%s..%s" % (repo['last_revision'], top_revision)
|
||
|
rev_cmd_range = patch_cmd_range
|
||
|
|
||
|
file_filter = repo.get('file_filter',".")
|
||
|
|
||
|
# Filter out unwanted files
|
||
|
exclude = repo.get('file_exclude', '')
|
||
|
if exclude:
|
||
|
for path in exclude.split():
|
||
|
p = "%s/%s" % (dest_dir, path) if dest_dir != '.' else path
|
||
|
file_filter += " ':!%s'" % p
|
||
|
|
||
|
patch_cmd = "git format-patch -N %s --output-directory %s %s -- %s" % \
|
||
|
(prefix,repo_patch_dir, patch_cmd_range, file_filter)
|
||
|
output = runcmd(patch_cmd, ldir)
|
||
|
logger.debug("generated patch set:\n%s" % output)
|
||
|
patchlist = output.splitlines()
|
||
|
|
||
|
rev_cmd = "git rev-list --no-merges %s -- %s" % (rev_cmd_range, file_filter)
|
||
|
revlist = runcmd(rev_cmd, ldir).splitlines()
|
||
|
|
||
|
# Step 3: Call repo specific hook to adjust patch
|
||
|
if 'hook' in repo:
|
||
|
# hook parameter is: ./hook patchpath revision reponame
|
||
|
count=len(revlist)-1
|
||
|
for patch in patchlist:
|
||
|
runcmd("%s %s %s %s" % (repo['hook'], patch, revlist[count], name))
|
||
|
count=count-1
|
||
|
|
||
|
# Step 4: write patch list and revision list to file, for user to edit later
|
||
|
patchlist_file = os.path.join(os.getcwd(), patch_dir, "patchlist-%s" % name)
|
||
|
repo['patchlist'] = patchlist_file
|
||
|
f = open(patchlist_file, 'w')
|
||
|
count=len(revlist)-1
|
||
|
for patch in patchlist:
|
||
|
f.write("%s %s\n" % (patch, revlist[count]))
|
||
|
check_patch(os.path.join(patch_dir, patch))
|
||
|
count=count-1
|
||
|
f.close()
|
||
|
|
||
|
# Step 5: invoke bash for user to edit patch and patch list
|
||
|
if conf.interactive:
|
||
|
print('You may now edit the patch and patch list in %s\n' \
|
||
|
'For example, you can remove unwanted patch entries from patchlist-*, so that they will be not applied later' % patch_dir);
|
||
|
if not drop_to_shell(patch_dir):
|
||
|
sys.exit(1)
|
||
|
|
||
|
# Step 6: apply the generated and revised patch
|
||
|
apply_patchlist(conf, repos)
|
||
|
runcmd("rm -rf %s" % patch_dir)
|
||
|
|
||
|
# Step 7: commit the updated config file if it's being tracked
|
||
|
commit_conf_file(conf, components)
|
||
|
|
||
|
def conf_commit_msg(conf, components):
|
||
|
# create the "components" string
|
||
|
component_str = "all components"
|
||
|
if len(components) > 0:
|
||
|
# otherwise tell which components were actually changed
|
||
|
component_str = ", ".join(components)
|
||
|
|
||
|
# expand the template with known values
|
||
|
template = Template(conf.commit_msg_template)
|
||
|
msg = template.substitute(components = component_str)
|
||
|
return msg
|
||
|
|
||
|
def commit_conf_file(conf, components, commit=True):
|
||
|
relpath = os.path.relpath(conf.conffile)
|
||
|
try:
|
||
|
output = runcmd("git status --porcelain %s" % relpath, printerr=False)
|
||
|
except:
|
||
|
# Outside the repository
|
||
|
output = None
|
||
|
if output:
|
||
|
if output.lstrip().startswith("M"):
|
||
|
logger.info("Committing updated configuration file")
|
||
|
if commit:
|
||
|
msg = conf_commit_msg(conf, components)
|
||
|
runcmd('git commit -m'.split() + [msg, relpath])
|
||
|
else:
|
||
|
runcmd('git add %s' % relpath)
|
||
|
return True
|
||
|
return False
|
||
|
|
||
|
def apply_patchlist(conf, repos):
|
||
|
"""
|
||
|
apply the generated patch list to combo repo
|
||
|
"""
|
||
|
for name in repos:
|
||
|
repo = conf.repos[name]
|
||
|
lastrev = repo["last_revision"]
|
||
|
prevrev = lastrev
|
||
|
|
||
|
# Get non-blank lines from patch list file
|
||
|
patchlist = []
|
||
|
if os.path.exists(repo['patchlist']) or not conf.interactive:
|
||
|
# Note: we want this to fail here if the file doesn't exist and we're not in
|
||
|
# interactive mode since the file should exist in this case
|
||
|
with open(repo['patchlist']) as f:
|
||
|
for line in f:
|
||
|
line = line.rstrip()
|
||
|
if line:
|
||
|
patchlist.append(line)
|
||
|
|
||
|
ldir = conf.repos[name]['local_repo_dir']
|
||
|
branch = conf.repos[name].get('branch', "master")
|
||
|
branchrev = runcmd("git rev-parse %s" % branch, ldir).strip()
|
||
|
|
||
|
if patchlist:
|
||
|
logger.info("Applying patches from %s..." % name)
|
||
|
linecount = len(patchlist)
|
||
|
i = 1
|
||
|
for line in patchlist:
|
||
|
patchfile = line.split()[0]
|
||
|
lastrev = line.split()[1]
|
||
|
patchdisp = os.path.relpath(patchfile)
|
||
|
if os.path.getsize(patchfile) == 0:
|
||
|
logger.info("(skipping %d/%d %s - no changes)" % (i, linecount, patchdisp))
|
||
|
else:
|
||
|
cmd = "git am --keep-cr %s-p1 %s" % ('-s ' if repo.get('signoff', True) else '', patchfile)
|
||
|
logger.info("Applying %d/%d: %s" % (i, linecount, patchdisp))
|
||
|
try:
|
||
|
runcmd(cmd)
|
||
|
except subprocess.CalledProcessError:
|
||
|
logger.info('Running "git am --abort" to cleanup repo')
|
||
|
runcmd("git am --abort")
|
||
|
logger.error('"%s" failed' % cmd)
|
||
|
logger.info("Please manually apply patch %s" % patchdisp)
|
||
|
logger.info("Note: if you exit and continue applying without manually applying the patch, it will be skipped")
|
||
|
if not drop_to_shell():
|
||
|
if prevrev != repo['last_revision']:
|
||
|
conf.update(name, "last_revision", prevrev)
|
||
|
sys.exit(1)
|
||
|
prevrev = lastrev
|
||
|
i += 1
|
||
|
# Once all patches are applied, we should update
|
||
|
# last_revision to the branch head instead of the last
|
||
|
# applied patch. The two are not necessarily the same when
|
||
|
# the last commit is a merge commit or when the patches at
|
||
|
# the branch head were intentionally excluded.
|
||
|
#
|
||
|
# If we do not do that for a merge commit, the next
|
||
|
# combo-layer run will only exclude patches reachable from
|
||
|
# one of the merged branches and try to re-apply patches
|
||
|
# from other branches even though they were already
|
||
|
# copied.
|
||
|
#
|
||
|
# If patches were intentionally excluded, the next run will
|
||
|
# present them again instead of skipping over them. This
|
||
|
# may or may not be intended, so the code here is conservative
|
||
|
# and only addresses the "head is merge commit" case.
|
||
|
if lastrev != branchrev and \
|
||
|
len(runcmd("git show --pretty=format:%%P --no-patch %s" % branch, ldir).split()) > 1:
|
||
|
lastrev = branchrev
|
||
|
else:
|
||
|
logger.info("No patches to apply from %s" % name)
|
||
|
lastrev = branchrev
|
||
|
|
||
|
if lastrev != repo['last_revision']:
|
||
|
conf.update(name, "last_revision", lastrev)
|
||
|
|
||
|
def action_splitpatch(conf, args):
|
||
|
"""
|
||
|
generate the commit patch and
|
||
|
split the patch per repo
|
||
|
"""
|
||
|
logger.debug("action_splitpatch")
|
||
|
if len(args) > 1:
|
||
|
commit = args[1]
|
||
|
else:
|
||
|
commit = "HEAD"
|
||
|
patchdir = "splitpatch-%s" % commit
|
||
|
if not os.path.exists(patchdir):
|
||
|
os.mkdir(patchdir)
|
||
|
|
||
|
# filerange_root is for the repo whose dest_dir is root "."
|
||
|
# and it should be specified by excluding all other repo dest dir
|
||
|
# like "-x repo1 -x repo2 -x repo3 ..."
|
||
|
filerange_root = ""
|
||
|
for name in conf.repos:
|
||
|
dest_dir = conf.repos[name]['dest_dir']
|
||
|
if dest_dir != ".":
|
||
|
filerange_root = '%s -x "%s/*"' % (filerange_root, dest_dir)
|
||
|
|
||
|
for name in conf.repos:
|
||
|
dest_dir = conf.repos[name]['dest_dir']
|
||
|
patch_filename = "%s/%s.patch" % (patchdir, name)
|
||
|
if dest_dir == ".":
|
||
|
cmd = "git format-patch -n1 --stdout %s^..%s | filterdiff -p1 %s > %s" % (commit, commit, filerange_root, patch_filename)
|
||
|
else:
|
||
|
cmd = "git format-patch --no-prefix -n1 --stdout %s^..%s -- %s > %s" % (commit, commit, dest_dir, patch_filename)
|
||
|
runcmd(cmd)
|
||
|
# Detect empty patches (including those produced by filterdiff above
|
||
|
# that contain only preamble text)
|
||
|
if os.path.getsize(patch_filename) == 0 or runcmd("filterdiff %s" % patch_filename) == "":
|
||
|
os.remove(patch_filename)
|
||
|
logger.info("(skipping %s - no changes)", name)
|
||
|
else:
|
||
|
logger.info(patch_filename)
|
||
|
|
||
|
def update_with_history(conf, components, revisions, repos):
|
||
|
'''Update all components with full history.
|
||
|
|
||
|
Works by importing all commits reachable from a component's
|
||
|
current head revision. If those commits are rooted in an already
|
||
|
imported commit, their content gets mixed with the content of the
|
||
|
combined repo of that commit (new or modified files overwritten,
|
||
|
removed files removed).
|
||
|
|
||
|
The last commit is an artificial merge commit that merges all the
|
||
|
updated components into the combined repository.
|
||
|
|
||
|
The HEAD ref only gets updated at the very end. All intermediate work
|
||
|
happens in a worktree which will get garbage collected by git eventually
|
||
|
after a failure.
|
||
|
'''
|
||
|
# Remember current HEAD and what we need to add to it.
|
||
|
head = runcmd("git rev-parse HEAD").strip()
|
||
|
additional_heads = {}
|
||
|
|
||
|
# Track the mapping between original commit and commit in the
|
||
|
# combined repo. We do not have to distinguish between components,
|
||
|
# because commit hashes are different anyway. Often we can
|
||
|
# skip find_revs() entirely (for example, when all new commits
|
||
|
# are derived from the last imported revision).
|
||
|
#
|
||
|
# Using "head" (typically the merge commit) instead of the actual
|
||
|
# commit for the component leads to a nicer history in the combined
|
||
|
# repo.
|
||
|
old2new_revs = {}
|
||
|
for name in repos:
|
||
|
repo = conf.repos[name]
|
||
|
revision = repo['last_revision']
|
||
|
if revision:
|
||
|
old2new_revs[revision] = head
|
||
|
|
||
|
def add_p(parents):
|
||
|
'''Insert -p before each entry.'''
|
||
|
parameters = []
|
||
|
for p in parents:
|
||
|
parameters.append('-p')
|
||
|
parameters.append(p)
|
||
|
return parameters
|
||
|
|
||
|
# Do all intermediate work with a separate work dir and index,
|
||
|
# chosen via env variables (can't use "git worktree", it is too
|
||
|
# new). This is useful (no changes to current work tree unless the
|
||
|
# update succeeds) and required (otherwise we end up temporarily
|
||
|
# removing the combo-layer hooks that we currently use when
|
||
|
# importing a new component).
|
||
|
#
|
||
|
# Not cleaned up after a failure at the moment.
|
||
|
wdir = os.path.join(os.getcwd(), ".git", "combo-layer")
|
||
|
windex = wdir + ".index"
|
||
|
if os.path.isdir(wdir):
|
||
|
shutil.rmtree(wdir)
|
||
|
os.mkdir(wdir)
|
||
|
wenv = copy.deepcopy(os.environ)
|
||
|
wenv["GIT_WORK_TREE"] = wdir
|
||
|
wenv["GIT_INDEX_FILE"] = windex
|
||
|
# This one turned out to be needed in practice.
|
||
|
wenv["GIT_OBJECT_DIRECTORY"] = os.path.join(os.getcwd(), ".git", "objects")
|
||
|
wargs = {"destdir": wdir, "env": wenv}
|
||
|
|
||
|
for name in repos:
|
||
|
revision = revisions.get(name, None)
|
||
|
repo = conf.repos[name]
|
||
|
ldir = repo['local_repo_dir']
|
||
|
dest_dir = repo['dest_dir']
|
||
|
branch = repo.get('branch', "master")
|
||
|
hook = repo.get('hook', None)
|
||
|
largs = {"destdir": ldir, "env": None}
|
||
|
file_include = repo.get('file_filter', '').split()
|
||
|
file_include.sort() # make sure that short entries like '.' come first.
|
||
|
file_exclude = repo.get('file_exclude', '').split()
|
||
|
|
||
|
def include_file(file):
|
||
|
if not file_include:
|
||
|
# No explicit filter set, include file.
|
||
|
return True
|
||
|
for filter in file_include:
|
||
|
if filter == '.':
|
||
|
# Another special case: include current directory and thus all files.
|
||
|
return True
|
||
|
if os.path.commonprefix((filter, file)) == filter:
|
||
|
# Included in directory or direct file match.
|
||
|
return True
|
||
|
# Check for wildcard match *with* allowing * to match /, i.e.
|
||
|
# src/*.c does match src/foobar/*.c. That's not how it is done elsewhere
|
||
|
# when passing the filtering to "git archive", but it is unclear what
|
||
|
# the intended semantic is (the comment on file_exclude that "append a * wildcard
|
||
|
# at the end" to match the full content of a directories implies that
|
||
|
# slashes are indeed not special), so here we simply do what's easy to
|
||
|
# implement in Python.
|
||
|
logger.debug('fnmatch(%s, %s)' % (file, filter))
|
||
|
if fnmatch.fnmatchcase(file, filter):
|
||
|
return True
|
||
|
return False
|
||
|
|
||
|
def exclude_file(file):
|
||
|
for filter in file_exclude:
|
||
|
if fnmatch.fnmatchcase(file, filter):
|
||
|
return True
|
||
|
return False
|
||
|
|
||
|
def file_filter(files):
|
||
|
'''Clean up file list so that only included files remain.'''
|
||
|
index = 0
|
||
|
while index < len(files):
|
||
|
file = files[index]
|
||
|
if not include_file(file) or exclude_file(file):
|
||
|
del files[index]
|
||
|
else:
|
||
|
index += 1
|
||
|
|
||
|
|
||
|
# Generate the revision list.
|
||
|
logger.info("Analyzing commits from %s..." % name)
|
||
|
top_revision = revision or branch
|
||
|
if not check_rev_branch(name, ldir, top_revision, branch):
|
||
|
sys.exit(1)
|
||
|
|
||
|
last_revision = repo['last_revision']
|
||
|
rev_list_args = "--full-history --sparse --topo-order --reverse"
|
||
|
if not last_revision:
|
||
|
logger.info("Warning: last_revision of component %s is not set, starting from the first commit" % name)
|
||
|
rev_list_args = rev_list_args + ' ' + top_revision
|
||
|
else:
|
||
|
if not check_rev_branch(name, ldir, last_revision, branch):
|
||
|
sys.exit(1)
|
||
|
rev_list_args = "%s %s..%s" % (rev_list_args, last_revision, top_revision)
|
||
|
|
||
|
# By definition, the current HEAD contains the latest imported
|
||
|
# commit of each component. We use that as initial mapping even
|
||
|
# though the commits do not match exactly because
|
||
|
# a) it always works (in contrast to find_revs, which relies on special
|
||
|
# commit messages)
|
||
|
# b) it is faster than find_revs, which will only be called on demand
|
||
|
# and can be skipped entirely in most cases
|
||
|
# c) last but not least, the combined history looks nicer when all
|
||
|
# new commits are rooted in the same merge commit
|
||
|
old2new_revs[last_revision] = head
|
||
|
|
||
|
# We care about all commits (--full-history and --sparse) and
|
||
|
# we want reconstruct the topology and thus do not care
|
||
|
# about ordering by time (--topo-order). We ask for the ones
|
||
|
# we need to import first to be listed first (--reverse).
|
||
|
revs = runcmd("git rev-list %s" % rev_list_args, **largs).split()
|
||
|
logger.debug("To be imported: %s" % revs)
|
||
|
# Now 'revs' contains all revisions reachable from the top revision.
|
||
|
# All revisions derived from the 'last_revision' definitely are new,
|
||
|
# whereas the others may or may not have been imported before. For
|
||
|
# a linear history in the component, that second set will be empty.
|
||
|
# To distinguish between them, we also get the shorter list
|
||
|
# of revisions starting at the ancestor.
|
||
|
if last_revision:
|
||
|
ancestor_revs = runcmd("git rev-list --ancestry-path %s" % rev_list_args, **largs).split()
|
||
|
else:
|
||
|
ancestor_revs = []
|
||
|
logger.debug("Ancestors: %s" % ancestor_revs)
|
||
|
|
||
|
# Now import each revision.
|
||
|
logger.info("Importing commits from %s..." % name)
|
||
|
def import_rev(rev):
|
||
|
global scanned_revs
|
||
|
|
||
|
# If it is part of the new commits, we definitely need
|
||
|
# to import it. Otherwise we need to check, we might have
|
||
|
# imported it before. If it was imported and we merely
|
||
|
# fail to find it because commit messages did not track
|
||
|
# the mapping, then we end up importing it again. So
|
||
|
# combined repos using "updating with history" really should
|
||
|
# enable the "From ... rev:" commit header modifications.
|
||
|
if rev not in ancestor_revs and rev not in old2new_revs and not scanned_revs:
|
||
|
logger.debug("Revision %s triggers log analysis." % rev)
|
||
|
find_revs(old2new_revs, head)
|
||
|
scanned_revs = True
|
||
|
new_rev = old2new_revs.get(rev, None)
|
||
|
if new_rev:
|
||
|
return new_rev
|
||
|
|
||
|
# If the commit is not in the original list of revisions
|
||
|
# to be imported, then it must be a parent of one of those
|
||
|
# commits and it was skipped during earlier imports or not
|
||
|
# found. Importing such merge commits leads to very ugly
|
||
|
# history (long cascade of merge commits which all point
|
||
|
# to to older commits) when switching from "update via
|
||
|
# patches" to "update with history".
|
||
|
#
|
||
|
# We can avoid importing merge commits if all non-merge commits
|
||
|
# reachable from it were already imported. In that case we
|
||
|
# can root the new commits in the current head revision.
|
||
|
def is_imported(prev):
|
||
|
parents = runcmd("git show --no-patch --pretty=format:%P " + prev, **largs).split()
|
||
|
if len(parents) > 1:
|
||
|
for p in parents:
|
||
|
if not is_imported(p):
|
||
|
logger.debug("Must import %s because %s is not imported." % (rev, p))
|
||
|
return False
|
||
|
return True
|
||
|
elif prev in old2new_revs:
|
||
|
return True
|
||
|
else:
|
||
|
logger.debug("Must import %s because %s is not imported." % (rev, prev))
|
||
|
return False
|
||
|
if rev not in revs and is_imported(rev):
|
||
|
old2new_revs[rev] = head
|
||
|
return head
|
||
|
|
||
|
# Need to import rev. Collect some information about it.
|
||
|
logger.debug("Importing %s" % rev)
|
||
|
(parents, author_name, author_email, author_timestamp, body) = \
|
||
|
runcmd("git show --no-patch --pretty=format:%P%x00%an%x00%ae%x00%at%x00%B " + rev, **largs).split(chr(0))
|
||
|
parents = parents.split()
|
||
|
if parents:
|
||
|
# Arbitrarily pick the first parent as base. It may or may not have
|
||
|
# been imported before. For example, if the parent is a merge commit
|
||
|
# and previously the combined repository used patching as update
|
||
|
# method, then the actual merge commit parent never was imported.
|
||
|
# To cover this, We recursively import parents.
|
||
|
parent = parents[0]
|
||
|
new_parent = import_rev(parent)
|
||
|
# Clean index and working tree. TODO: can we combine this and the
|
||
|
# next into one command with less file IO?
|
||
|
# "git reset --hard" does not work, it changes HEAD of the parent
|
||
|
# repo, which we wanted to avoid. Probably need to keep
|
||
|
# track of the rev that corresponds to the index and use apply_commit().
|
||
|
runcmd("git rm -q --ignore-unmatch -rf .", **wargs)
|
||
|
# Update index and working tree to match the parent.
|
||
|
runcmd("git checkout -q -f %s ." % new_parent, **wargs)
|
||
|
else:
|
||
|
parent = None
|
||
|
# Clean index and working tree.
|
||
|
runcmd("git rm -q --ignore-unmatch -rf .", **wargs)
|
||
|
|
||
|
# Modify index and working tree such that it mirrors the commit.
|
||
|
apply_commit(parent, rev, largs, wargs, dest_dir, file_filter=file_filter)
|
||
|
|
||
|
# Now commit.
|
||
|
new_tree = runcmd("git write-tree", **wargs).strip()
|
||
|
env = copy.deepcopy(wenv)
|
||
|
env['GIT_AUTHOR_NAME'] = author_name
|
||
|
env['GIT_AUTHOR_EMAIL'] = author_email
|
||
|
env['GIT_AUTHOR_DATE'] = author_timestamp
|
||
|
if hook:
|
||
|
# Need to turn the verbatim commit message into something resembling a patch header
|
||
|
# for the hook.
|
||
|
with tempfile.NamedTemporaryFile(mode='wt', delete=False) as patch:
|
||
|
patch.write('Subject: [PATCH] ')
|
||
|
patch.write(body)
|
||
|
patch.write('\n---\n')
|
||
|
patch.close()
|
||
|
runcmd([hook, patch.name, rev, name])
|
||
|
with open(patch.name) as f:
|
||
|
body = f.read()[len('Subject: [PATCH] '):][:-len('\n---\n')]
|
||
|
|
||
|
# We can skip non-merge commits that did not change any files. Those are typically
|
||
|
# the result of file filtering, although they could also have been introduced
|
||
|
# intentionally upstream, in which case we drop some information here.
|
||
|
if len(parents) == 1:
|
||
|
parent_rev = import_rev(parents[0])
|
||
|
old_tree = runcmd("git show -s --pretty=format:%T " + parent_rev, **wargs).strip()
|
||
|
commit = old_tree != new_tree
|
||
|
if not commit:
|
||
|
new_rev = parent_rev
|
||
|
else:
|
||
|
commit = True
|
||
|
if commit:
|
||
|
new_rev = runcmd("git commit-tree".split() + add_p([import_rev(p) for p in parents]) +
|
||
|
["-m", body, new_tree],
|
||
|
env=env).strip()
|
||
|
old2new_revs[rev] = new_rev
|
||
|
|
||
|
return new_rev
|
||
|
|
||
|
if revs:
|
||
|
for rev in revs:
|
||
|
import_rev(rev)
|
||
|
# Remember how to update our current head. New components get added,
|
||
|
# updated components get the delta between current head and the updated component
|
||
|
# applied.
|
||
|
additional_heads[old2new_revs[revs[-1]]] = head if repo['last_revision'] else None
|
||
|
repo['last_revision'] = revs[-1]
|
||
|
|
||
|
# Now construct the final merge commit. We create the tree by
|
||
|
# starting with the head and applying the changes from each
|
||
|
# components imported head revision.
|
||
|
if additional_heads:
|
||
|
runcmd("git reset --hard", **wargs)
|
||
|
for rev, base in additional_heads.items():
|
||
|
apply_commit(base, rev, wargs, wargs, None)
|
||
|
|
||
|
# Commit with all component branches as parents as well as the previous head.
|
||
|
logger.info("Writing final merge commit...")
|
||
|
msg = conf_commit_msg(conf, components)
|
||
|
new_tree = runcmd("git write-tree", **wargs).strip()
|
||
|
new_rev = runcmd("git commit-tree".split() +
|
||
|
add_p([head] + list(additional_heads.keys())) +
|
||
|
["-m", msg, new_tree],
|
||
|
**wargs).strip()
|
||
|
# And done! This is the first time we change the HEAD in the actual work tree.
|
||
|
runcmd("git reset --hard %s" % new_rev)
|
||
|
|
||
|
# Update and stage the (potentially modified)
|
||
|
# combo-layer.conf, but do not commit separately.
|
||
|
for name in repos:
|
||
|
repo = conf.repos[name]
|
||
|
rev = repo['last_revision']
|
||
|
conf.update(name, "last_revision", rev)
|
||
|
if commit_conf_file(conf, components, False):
|
||
|
# Must augment the previous commit.
|
||
|
runcmd("git commit --amend -C HEAD")
|
||
|
|
||
|
|
||
|
scanned_revs = False
|
||
|
def find_revs(old2new, head):
|
||
|
'''Construct mapping from original commit hash to commit hash in
|
||
|
combined repo by looking at the commit messages. Depends on the
|
||
|
"From ... rev: ..." convention.'''
|
||
|
logger.info("Analyzing log messages to find previously imported commits...")
|
||
|
num_known = len(old2new)
|
||
|
log = runcmd("git log --grep='From .* rev: [a-fA-F0-9][a-fA-F0-9]*' --pretty=format:%H%x00%B%x00 " + head).split(chr(0))
|
||
|
regex = re.compile(r'From .* rev: ([a-fA-F0-9]+)')
|
||
|
for new_rev, body in zip(*[iter(log)]* 2):
|
||
|
# Use the last one, in the unlikely case there are more than one.
|
||
|
rev = regex.findall(body)[-1]
|
||
|
if rev not in old2new:
|
||
|
old2new[rev] = new_rev.strip()
|
||
|
logger.info("Found %d additional commits, leading to: %s" % (len(old2new) - num_known, old2new))
|
||
|
|
||
|
|
||
|
def apply_commit(parent, rev, largs, wargs, dest_dir, file_filter=None):
|
||
|
'''Compare revision against parent, remove files deleted in the
|
||
|
commit, re-write new or modified ones. Moves them into dest_dir.
|
||
|
Optionally filters files.
|
||
|
'''
|
||
|
if not dest_dir:
|
||
|
dest_dir = "."
|
||
|
# -r recurses into sub-directories, given is the full overview of
|
||
|
# what changed. We do not care about copy/edits or renames, so we
|
||
|
# can disable those with --no-renames (but we still parse them,
|
||
|
# because it was not clear from git documentation whether C and M
|
||
|
# lines can still occur).
|
||
|
logger.debug("Applying changes between %s and %s in %s" % (parent, rev, largs["destdir"]))
|
||
|
delete = []
|
||
|
update = []
|
||
|
if parent:
|
||
|
# Apply delta.
|
||
|
changes = runcmd("git diff-tree --no-commit-id --no-renames --name-status -r --raw -z %s %s" % (parent, rev), **largs).split(chr(0))
|
||
|
for status, name in zip(*[iter(changes)]*2):
|
||
|
if status[0] in "ACMRT":
|
||
|
update.append(name)
|
||
|
elif status[0] in "D":
|
||
|
delete.append(name)
|
||
|
else:
|
||
|
logger.error("Unknown status %s of file %s in revision %s" % (status, name, rev))
|
||
|
sys.exit(1)
|
||
|
else:
|
||
|
# Copy all files.
|
||
|
update.extend(runcmd("git ls-tree -r --name-only -z %s" % rev, **largs).split(chr(0)))
|
||
|
|
||
|
# Include/exclude files as define in the component config.
|
||
|
# Both updated and deleted file lists get filtered, because it might happen
|
||
|
# that a file gets excluded, pulled from a different component, and then the
|
||
|
# excluded file gets deleted. In that case we must keep the copy.
|
||
|
if file_filter:
|
||
|
file_filter(update)
|
||
|
file_filter(delete)
|
||
|
|
||
|
# We export into a tar archive here and extract with tar because it is simple (no
|
||
|
# need to implement file and symlink writing ourselves) and gives us some degree
|
||
|
# of parallel IO. The downside is that we have to pass the list of files via
|
||
|
# command line parameters - hopefully there will never be too many at once.
|
||
|
if update:
|
||
|
target = os.path.join(wargs["destdir"], dest_dir)
|
||
|
if not os.path.isdir(target):
|
||
|
os.makedirs(target)
|
||
|
quoted_target = pipes.quote(target)
|
||
|
# os.sysconf('SC_ARG_MAX') is lying: running a command with
|
||
|
# string length 629343 already failed with "Argument list too
|
||
|
# long" although SC_ARG_MAX = 2097152. "man execve" explains
|
||
|
# the limitations, but those are pretty complicated. So here
|
||
|
# we just hard-code a fixed value which is more likely to work.
|
||
|
max_cmdsize = 64 * 1024
|
||
|
while update:
|
||
|
quoted_args = []
|
||
|
unquoted_args = []
|
||
|
cmdsize = 100 + len(quoted_target)
|
||
|
while update:
|
||
|
quoted_next = pipes.quote(update[0])
|
||
|
size_next = len(quoted_next) + len(dest_dir) + 1
|
||
|
logger.debug('cmdline length %d + %d < %d?' % (cmdsize, size_next, os.sysconf('SC_ARG_MAX')))
|
||
|
if cmdsize + size_next < max_cmdsize:
|
||
|
quoted_args.append(quoted_next)
|
||
|
unquoted_args.append(update.pop(0))
|
||
|
cmdsize += size_next
|
||
|
else:
|
||
|
logger.debug('Breaking the cmdline at length %d' % cmdsize)
|
||
|
break
|
||
|
logger.debug('Final cmdline length %d / %d' % (cmdsize, os.sysconf('SC_ARG_MAX')))
|
||
|
cmd = "git archive %s %s | tar -C %s -xf -" % (rev, ' '.join(quoted_args), quoted_target)
|
||
|
logger.debug('First cmdline length %d' % len(cmd))
|
||
|
runcmd(cmd, **largs)
|
||
|
cmd = "git add -f".split() + [os.path.join(dest_dir, x) for x in unquoted_args]
|
||
|
logger.debug('Second cmdline length %d' % reduce(lambda x, y: x + len(y), cmd, 0))
|
||
|
runcmd(cmd, **wargs)
|
||
|
if delete:
|
||
|
for path in delete:
|
||
|
if dest_dir:
|
||
|
path = os.path.join(dest_dir, path)
|
||
|
runcmd("git rm -f --ignore-unmatch".split() + [os.path.join(dest_dir, x) for x in delete], **wargs)
|
||
|
|
||
|
def action_error(conf, args):
|
||
|
logger.info("invalid action %s" % args[0])
|
||
|
|
||
|
actions = {
|
||
|
"init": action_init,
|
||
|
"update": action_update,
|
||
|
"pull": action_pull,
|
||
|
"splitpatch": action_splitpatch,
|
||
|
}
|
||
|
|
||
|
def main():
|
||
|
parser = optparse.OptionParser(
|
||
|
version = "Combo Layer Repo Tool version %s" % __version__,
|
||
|
usage = """%prog [options] action
|
||
|
|
||
|
Create and update a combination layer repository from multiple component repositories.
|
||
|
|
||
|
Action:
|
||
|
init initialise the combo layer repo
|
||
|
update [components] get patches from component repos and apply them to the combo repo
|
||
|
pull [components] just pull component repos only
|
||
|
splitpatch [commit] generate commit patch and split per component, default commit is HEAD""")
|
||
|
|
||
|
parser.add_option("-c", "--conf", help = "specify the config file (conf/combo-layer.conf is the default).",
|
||
|
action = "store", dest = "conffile", default = "conf/combo-layer.conf")
|
||
|
|
||
|
parser.add_option("-i", "--interactive", help = "interactive mode, user can edit the patch list and patches",
|
||
|
action = "store_true", dest = "interactive", default = False)
|
||
|
|
||
|
parser.add_option("-D", "--debug", help = "output debug information",
|
||
|
action = "store_true", dest = "debug", default = False)
|
||
|
|
||
|
parser.add_option("-n", "--no-pull", help = "skip pulling component repos during update",
|
||
|
action = "store_true", dest = "nopull", default = False)
|
||
|
|
||
|
parser.add_option("--hard-reset",
|
||
|
help = "instead of pull do fetch and hard-reset in component repos",
|
||
|
action = "store_true", dest = "hard_reset", default = False)
|
||
|
|
||
|
parser.add_option("-H", "--history", help = "import full history of components during init",
|
||
|
action = "store_true", default = False)
|
||
|
|
||
|
options, args = parser.parse_args(sys.argv)
|
||
|
|
||
|
# Dispatch to action handler
|
||
|
if len(args) == 1:
|
||
|
logger.error("No action specified, exiting")
|
||
|
parser.print_help()
|
||
|
elif args[1] not in actions:
|
||
|
logger.error("Unsupported action %s, exiting\n" % (args[1]))
|
||
|
parser.print_help()
|
||
|
elif not os.path.exists(options.conffile):
|
||
|
logger.error("No valid config file, exiting\n")
|
||
|
parser.print_help()
|
||
|
else:
|
||
|
if options.debug:
|
||
|
logger.setLevel(logging.DEBUG)
|
||
|
confdata = Configuration(options)
|
||
|
initmode = (args[1] == 'init')
|
||
|
confdata.sanity_check(initmode)
|
||
|
actions.get(args[1], action_error)(confdata, args[1:])
|
||
|
|
||
|
if __name__ == "__main__":
|
||
|
try:
|
||
|
ret = main()
|
||
|
except Exception:
|
||
|
ret = 1
|
||
|
import traceback
|
||
|
traceback.print_exc()
|
||
|
sys.exit(ret)
|