2018-09-16 17:24:07 +00:00
|
|
|
#!/usr/bin/env python
|
|
|
|
|
2018-09-14 05:02:16 +00:00
|
|
|
"""Git helper functions.
|
|
|
|
|
2018-09-16 17:24:07 +00:00
|
|
|
Everything here should be project agnostic: it shouldn't rely on project's
|
|
|
|
structure, or make assumptions about the passed arguments or calls' outcomes.
|
2018-09-14 05:02:16 +00:00
|
|
|
"""
|
|
|
|
|
2020-10-30 10:05:38 +00:00
|
|
|
from __future__ import unicode_literals
|
|
|
|
|
|
|
|
import io
|
2018-09-14 05:02:16 +00:00
|
|
|
import os
|
2020-10-30 10:05:38 +00:00
|
|
|
import posixpath
|
2020-04-08 15:59:14 +00:00
|
|
|
import re
|
2018-09-14 05:02:16 +00:00
|
|
|
import subprocess
|
2020-04-08 15:59:14 +00:00
|
|
|
import sys
|
2018-09-14 05:02:16 +00:00
|
|
|
|
|
|
|
|
|
|
|
def is_repo_root(path):
|
|
|
|
path_exists = os.path.exists(path)
|
|
|
|
if not path_exists:
|
|
|
|
return False
|
|
|
|
|
|
|
|
git_folder_path = os.path.join(path, '.git')
|
|
|
|
git_folder_exists = os.path.exists(git_folder_path)
|
|
|
|
|
|
|
|
return git_folder_exists
|
|
|
|
|
|
|
|
|
|
|
|
def get_repo_root(path):
|
|
|
|
"""Finds a closest ancestor folder which is a repo root."""
|
|
|
|
norm_path = os.path.normpath(path)
|
|
|
|
norm_path_exists = os.path.exists(norm_path)
|
|
|
|
if not norm_path_exists:
|
|
|
|
return None
|
|
|
|
|
|
|
|
if is_repo_root(norm_path):
|
|
|
|
return norm_path
|
|
|
|
|
|
|
|
parent_path = os.path.dirname(norm_path)
|
|
|
|
|
|
|
|
# Check if we're in the root folder already.
|
|
|
|
if parent_path == norm_path:
|
|
|
|
return None
|
|
|
|
|
|
|
|
return get_repo_root(parent_path)
|
|
|
|
|
|
|
|
|
2019-04-03 19:42:49 +00:00
|
|
|
def am(repo, patch_data, threeway=False, directory=None, exclude=None,
|
2021-03-25 05:49:53 +00:00
|
|
|
committer_name=None, committer_email=None, keep_cr=True):
|
2018-10-24 18:24:11 +00:00
|
|
|
args = []
|
|
|
|
if threeway:
|
|
|
|
args += ['--3way']
|
2018-12-11 21:49:01 +00:00
|
|
|
if directory is not None:
|
|
|
|
args += ['--directory', directory]
|
2019-04-03 19:42:49 +00:00
|
|
|
if exclude is not None:
|
|
|
|
for path_pattern in exclude:
|
|
|
|
args += ['--exclude', path_pattern]
|
2021-03-25 05:49:53 +00:00
|
|
|
if keep_cr is True:
|
|
|
|
# Keep the CR of CRLF in case any patches target files with Windows line
|
|
|
|
# endings.
|
|
|
|
args += ['--keep-cr']
|
2019-04-03 19:42:49 +00:00
|
|
|
|
2018-10-24 18:24:11 +00:00
|
|
|
root_args = ['-C', repo]
|
|
|
|
if committer_name is not None:
|
|
|
|
root_args += ['-c', 'user.name=' + committer_name]
|
|
|
|
if committer_email is not None:
|
|
|
|
root_args += ['-c', 'user.email=' + committer_email]
|
2019-03-08 02:11:31 +00:00
|
|
|
root_args += ['-c', 'commit.gpgsign=false']
|
2018-10-24 18:24:11 +00:00
|
|
|
command = ['git'] + root_args + ['am'] + args
|
|
|
|
proc = subprocess.Popen(
|
|
|
|
command,
|
|
|
|
stdin=subprocess.PIPE)
|
2019-08-23 22:48:27 +00:00
|
|
|
proc.communicate(patch_data.encode('utf-8'))
|
2018-10-24 18:24:11 +00:00
|
|
|
if proc.returncode != 0:
|
|
|
|
raise RuntimeError("Command {} returned {}".format(command,
|
|
|
|
proc.returncode))
|
|
|
|
|
|
|
|
|
2018-09-16 17:24:07 +00:00
|
|
|
def apply_patch(repo, patch_path, directory=None, index=False, reverse=False):
|
2018-10-24 18:24:11 +00:00
|
|
|
args = ['git', '-C', repo, 'apply',
|
2018-09-14 05:02:16 +00:00
|
|
|
'--ignore-space-change',
|
|
|
|
'--ignore-whitespace',
|
|
|
|
'--whitespace', 'fix'
|
|
|
|
]
|
|
|
|
if directory:
|
|
|
|
args += ['--directory', directory]
|
|
|
|
if index:
|
|
|
|
args += ['--index']
|
|
|
|
if reverse:
|
|
|
|
args += ['--reverse']
|
|
|
|
args += ['--', patch_path]
|
|
|
|
|
2018-10-24 18:24:11 +00:00
|
|
|
return_code = subprocess.call(args)
|
|
|
|
applied_successfully = (return_code == 0)
|
|
|
|
return applied_successfully
|
2018-09-14 05:02:16 +00:00
|
|
|
|
|
|
|
|
2019-04-23 17:28:26 +00:00
|
|
|
def import_patches(repo, **kwargs):
|
|
|
|
"""same as am(), but we save the upstream HEAD so we can refer to it when we
|
|
|
|
later export patches"""
|
|
|
|
update_ref(
|
|
|
|
repo=repo,
|
|
|
|
ref='refs/patches/upstream-head',
|
|
|
|
newvalue='HEAD'
|
|
|
|
)
|
|
|
|
am(repo=repo, **kwargs)
|
|
|
|
|
|
|
|
|
2018-09-14 05:02:16 +00:00
|
|
|
def get_patch(repo, commit_hash):
|
2018-10-24 18:24:11 +00:00
|
|
|
args = ['git', '-C', repo, 'diff-tree',
|
2018-09-14 05:02:16 +00:00
|
|
|
'-p',
|
|
|
|
commit_hash,
|
2018-09-16 17:24:07 +00:00
|
|
|
'--' # Explicitly tell Git `commit_hash` is a revision, not a path.
|
2018-09-14 05:02:16 +00:00
|
|
|
]
|
|
|
|
|
2020-10-30 10:05:38 +00:00
|
|
|
return subprocess.check_output(args).decode('utf-8')
|
2018-09-14 05:02:16 +00:00
|
|
|
|
|
|
|
|
|
|
|
def get_head_commit(repo):
|
2018-10-24 18:24:11 +00:00
|
|
|
args = ['git', '-C', repo, 'rev-parse', 'HEAD']
|
2018-09-14 05:02:16 +00:00
|
|
|
|
2020-10-30 10:05:38 +00:00
|
|
|
return subprocess.check_output(args).decode('utf-8').strip()
|
2018-09-14 05:02:16 +00:00
|
|
|
|
|
|
|
|
2019-04-17 18:16:03 +00:00
|
|
|
def update_ref(repo, ref, newvalue):
|
|
|
|
args = ['git', '-C', repo, 'update-ref', ref, newvalue]
|
|
|
|
|
|
|
|
return subprocess.check_call(args)
|
|
|
|
|
|
|
|
|
2018-09-14 05:02:16 +00:00
|
|
|
def reset(repo):
|
2018-10-24 18:24:11 +00:00
|
|
|
args = ['git', '-C', repo, 'reset']
|
2018-09-14 05:02:16 +00:00
|
|
|
|
2018-10-24 18:24:11 +00:00
|
|
|
subprocess.check_call(args)
|
2018-09-14 05:02:16 +00:00
|
|
|
|
|
|
|
|
|
|
|
def commit(repo, author, message):
|
2020-04-08 15:59:14 +00:00
|
|
|
"""Commit whatever in the index is now."""
|
2018-09-14 05:02:16 +00:00
|
|
|
|
|
|
|
# Let's setup committer info so git won't complain about it being missing.
|
|
|
|
# TODO: Is there a better way to set committer's name and email?
|
|
|
|
env = os.environ.copy()
|
|
|
|
env['GIT_COMMITTER_NAME'] = 'Anonymous Committer'
|
|
|
|
env['GIT_COMMITTER_EMAIL'] = 'anonymous@electronjs.org'
|
|
|
|
|
2018-10-24 18:24:11 +00:00
|
|
|
args = ['git', '-C', repo, 'commit',
|
2018-09-14 05:02:16 +00:00
|
|
|
'--author', author,
|
|
|
|
'--message', message
|
|
|
|
]
|
|
|
|
|
2018-10-24 18:24:11 +00:00
|
|
|
return_code = subprocess.call(args, env=env)
|
|
|
|
committed_successfully = (return_code == 0)
|
|
|
|
return committed_successfully
|
2020-04-08 15:59:14 +00:00
|
|
|
|
|
|
|
def get_upstream_head(repo):
|
|
|
|
args = [
|
|
|
|
'git',
|
|
|
|
'-C',
|
|
|
|
repo,
|
|
|
|
'rev-parse',
|
|
|
|
'--verify',
|
|
|
|
'refs/patches/upstream-head',
|
|
|
|
]
|
2020-10-30 10:05:38 +00:00
|
|
|
return subprocess.check_output(args).decode('utf-8').strip()
|
2020-04-08 15:59:14 +00:00
|
|
|
|
|
|
|
def get_commit_count(repo, commit_range):
|
|
|
|
args = [
|
|
|
|
'git',
|
|
|
|
'-C',
|
|
|
|
repo,
|
|
|
|
'rev-list',
|
|
|
|
'--count',
|
|
|
|
commit_range
|
|
|
|
]
|
2020-10-30 10:05:38 +00:00
|
|
|
return int(subprocess.check_output(args).decode('utf-8').strip())
|
2020-04-08 15:59:14 +00:00
|
|
|
|
|
|
|
def guess_base_commit(repo):
|
|
|
|
"""Guess which commit the patches might be based on"""
|
|
|
|
try:
|
|
|
|
upstream_head = get_upstream_head(repo)
|
|
|
|
num_commits = get_commit_count(repo, upstream_head + '..')
|
|
|
|
return [upstream_head, num_commits]
|
|
|
|
except subprocess.CalledProcessError:
|
|
|
|
args = [
|
|
|
|
'git',
|
|
|
|
'-C',
|
|
|
|
repo,
|
|
|
|
'describe',
|
|
|
|
'--tags',
|
|
|
|
]
|
2020-10-30 10:05:38 +00:00
|
|
|
return subprocess.check_output(args).decode('utf-8').rsplit('-', 2)[0:2]
|
2020-04-08 15:59:14 +00:00
|
|
|
|
|
|
|
|
|
|
|
def format_patch(repo, since):
|
|
|
|
args = [
|
|
|
|
'git',
|
|
|
|
'-C',
|
|
|
|
repo,
|
|
|
|
'-c',
|
2020-10-30 10:05:38 +00:00
|
|
|
'core.attributesfile='
|
|
|
|
+ os.path.join(
|
|
|
|
os.path.dirname(os.path.realpath(__file__)),
|
|
|
|
'electron.gitattributes',
|
|
|
|
),
|
2020-04-08 15:59:14 +00:00
|
|
|
# Ensure it is not possible to match anything
|
|
|
|
# Disabled for now as we have consistent chunk headers
|
|
|
|
# '-c',
|
|
|
|
# 'diff.electron.xfuncname=$^',
|
|
|
|
'format-patch',
|
|
|
|
'--keep-subject',
|
|
|
|
'--no-stat',
|
|
|
|
'--stdout',
|
|
|
|
|
|
|
|
# Per RFC 3676 the signature is separated from the body by a line with
|
|
|
|
# '-- ' on it. If the signature option is omitted the signature defaults
|
|
|
|
# to the Git version number.
|
|
|
|
'--no-signature',
|
|
|
|
|
|
|
|
# The name of the parent commit object isn't useful information in this
|
|
|
|
# context, so zero it out to avoid needless patch-file churn.
|
|
|
|
'--zero-commit',
|
|
|
|
|
|
|
|
# Some versions of git print out different numbers of characters in the
|
|
|
|
# 'index' line of patches, so pass --full-index to get consistent
|
|
|
|
# behaviour.
|
|
|
|
'--full-index',
|
|
|
|
since
|
|
|
|
]
|
2020-10-30 10:05:38 +00:00
|
|
|
return subprocess.check_output(args).decode('utf-8')
|
2020-04-08 15:59:14 +00:00
|
|
|
|
|
|
|
|
|
|
|
def split_patches(patch_data):
|
|
|
|
"""Split a concatenated series of patches into N separate patches"""
|
|
|
|
patches = []
|
|
|
|
patch_start = re.compile('^From [0-9a-f]+ ')
|
2021-03-25 05:49:53 +00:00
|
|
|
# Keep line endings in case any patches target files with CRLF.
|
|
|
|
keep_line_endings = True
|
|
|
|
for line in patch_data.splitlines(keep_line_endings):
|
2020-04-08 15:59:14 +00:00
|
|
|
if patch_start.match(line):
|
|
|
|
patches.append([])
|
|
|
|
patches[-1].append(line)
|
|
|
|
return patches
|
|
|
|
|
|
|
|
|
|
|
|
def munge_subject_to_filename(subject):
|
|
|
|
"""Derive a suitable filename from a commit's subject"""
|
|
|
|
if subject.endswith('.patch'):
|
|
|
|
subject = subject[:-6]
|
|
|
|
return re.sub(r'[^A-Za-z0-9-]+', '_', subject).strip('_').lower() + '.patch'
|
|
|
|
|
|
|
|
|
|
|
|
def get_file_name(patch):
|
|
|
|
"""Return the name of the file to which the patch should be written"""
|
2021-03-25 05:49:53 +00:00
|
|
|
file_name = None
|
2020-04-08 15:59:14 +00:00
|
|
|
for line in patch:
|
|
|
|
if line.startswith('Patch-Filename: '):
|
2021-03-25 05:49:53 +00:00
|
|
|
file_name = line[len('Patch-Filename: '):]
|
|
|
|
break
|
2020-04-08 15:59:14 +00:00
|
|
|
# If no patch-filename header, munge the subject.
|
2021-03-25 05:49:53 +00:00
|
|
|
if not file_name:
|
|
|
|
for line in patch:
|
|
|
|
if line.startswith('Subject: '):
|
|
|
|
file_name = munge_subject_to_filename(line[len('Subject: '):])
|
|
|
|
break
|
|
|
|
return file_name.rstrip('\n')
|
|
|
|
|
|
|
|
|
|
|
|
def join_patch(patch):
|
|
|
|
"""Joins and formats patch contents"""
|
|
|
|
return ''.join(remove_patch_filename(patch)).rstrip('\n') + '\n'
|
2020-04-08 15:59:14 +00:00
|
|
|
|
|
|
|
|
|
|
|
def remove_patch_filename(patch):
|
|
|
|
"""Strip out the Patch-Filename trailer from a patch's message body"""
|
|
|
|
force_keep_next_line = False
|
|
|
|
for i, l in enumerate(patch):
|
|
|
|
is_patchfilename = l.startswith('Patch-Filename: ')
|
2020-10-30 10:05:38 +00:00
|
|
|
next_is_patchfilename = i < len(patch) - 1 and patch[i + 1].startswith(
|
|
|
|
'Patch-Filename: '
|
|
|
|
)
|
|
|
|
if not force_keep_next_line and (
|
|
|
|
is_patchfilename or (next_is_patchfilename and len(l.rstrip()) == 0)
|
|
|
|
):
|
|
|
|
pass # drop this line
|
2020-04-08 15:59:14 +00:00
|
|
|
else:
|
|
|
|
yield l
|
|
|
|
force_keep_next_line = l.startswith('Subject: ')
|
|
|
|
|
|
|
|
|
2020-06-05 00:43:28 +00:00
|
|
|
def export_patches(repo, out_dir, patch_range=None, dry_run=False):
|
2020-04-08 15:59:14 +00:00
|
|
|
if patch_range is None:
|
|
|
|
patch_range, num_patches = guess_base_commit(repo)
|
2020-10-30 10:05:38 +00:00
|
|
|
sys.stderr.write(
|
2021-01-04 19:24:59 +00:00
|
|
|
"Exporting {} patches in {} since {}\n".format(num_patches, repo, patch_range[0:7])
|
2020-10-30 10:05:38 +00:00
|
|
|
)
|
2020-04-08 15:59:14 +00:00
|
|
|
patch_data = format_patch(repo, patch_range)
|
|
|
|
patches = split_patches(patch_data)
|
|
|
|
|
|
|
|
try:
|
|
|
|
os.mkdir(out_dir)
|
|
|
|
except OSError:
|
|
|
|
pass
|
|
|
|
|
2020-06-05 00:43:28 +00:00
|
|
|
if dry_run:
|
|
|
|
# If we're doing a dry run, iterate through each patch and see if the newly
|
2020-10-30 10:05:38 +00:00
|
|
|
# exported patch differs from what exists. Report number of mismatched
|
|
|
|
# patches and fail if there's more than one.
|
2021-03-31 20:48:21 +00:00
|
|
|
bad_patches = []
|
2020-04-08 15:59:14 +00:00
|
|
|
for patch in patches:
|
|
|
|
filename = get_file_name(patch)
|
2020-10-30 10:05:38 +00:00
|
|
|
filepath = posixpath.join(out_dir, filename)
|
2021-03-31 20:48:21 +00:00
|
|
|
existing_patch = unicode(io.open(filepath, 'rb').read(), "utf-8")
|
2021-03-25 05:49:53 +00:00
|
|
|
formatted_patch = join_patch(patch)
|
2020-06-05 00:43:28 +00:00
|
|
|
if formatted_patch != existing_patch:
|
2021-03-31 20:48:21 +00:00
|
|
|
bad_patches.append(filename)
|
2021-04-01 23:27:35 +00:00
|
|
|
if len(bad_patches) > 0:
|
2020-10-30 10:05:38 +00:00
|
|
|
sys.stderr.write(
|
2021-03-31 20:48:21 +00:00
|
|
|
"Patches in {} not up to date: {} patches need update\n-- {}\n".format(
|
2021-04-01 23:27:35 +00:00
|
|
|
out_dir, len(bad_patches), "\n-- ".join(bad_patches)
|
2020-10-30 10:05:38 +00:00
|
|
|
)
|
|
|
|
)
|
2020-06-05 00:43:28 +00:00
|
|
|
exit(1)
|
|
|
|
else:
|
|
|
|
# Remove old patches so that deleted commits are correctly reflected in the
|
|
|
|
# patch files (as a removed file)
|
|
|
|
for p in os.listdir(out_dir):
|
|
|
|
if p.endswith('.patch'):
|
2020-10-30 10:05:38 +00:00
|
|
|
os.remove(posixpath.join(out_dir, p))
|
|
|
|
with io.open(
|
|
|
|
posixpath.join(out_dir, '.patches'),
|
|
|
|
'w',
|
|
|
|
newline='\n',
|
|
|
|
encoding='utf-8',
|
|
|
|
) as pl:
|
2020-06-05 00:43:28 +00:00
|
|
|
for patch in patches:
|
|
|
|
filename = get_file_name(patch)
|
2020-10-30 10:05:38 +00:00
|
|
|
file_path = posixpath.join(out_dir, filename)
|
2021-03-25 05:49:53 +00:00
|
|
|
formatted_patch = join_patch(patch)
|
|
|
|
# Write in binary mode to retain mixed line endings on write.
|
2020-10-30 10:05:38 +00:00
|
|
|
with io.open(
|
2021-03-25 05:49:53 +00:00
|
|
|
file_path, 'wb'
|
2020-10-30 10:05:38 +00:00
|
|
|
) as f:
|
2021-03-25 05:49:53 +00:00
|
|
|
f.write(formatted_patch.encode('utf-8'))
|
2020-06-05 00:43:28 +00:00
|
|
|
pl.write(filename + '\n')
|
|
|
|
|