2020-01-15 17:40:32 +01:00
|
|
|
#!/usr/bin/env python3
|
|
|
|
# Copyright 2019 Google LLC
|
|
|
|
#
|
|
|
|
# Licensed under the Apache License v2.0 with LLVM Exceptions (the "License");
|
|
|
|
# you may not use this file except in compliance with the License.
|
|
|
|
# You may obtain a copy of the License at
|
|
|
|
#
|
|
|
|
# https://llvm.org/LICENSE.txt
|
|
|
|
#
|
|
|
|
# Unless required by applicable law or agreed to in writing, software
|
|
|
|
# distributed under the License is distributed on an "AS IS" BASIS,
|
|
|
|
# WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
|
|
|
|
# See the License for the specific language governing permissions and
|
|
|
|
# limitations under the License.
|
2020-02-04 14:18:19 +01:00
|
|
|
|
2020-01-15 17:40:32 +01:00
|
|
|
import argparse
|
2020-05-12 08:46:24 +02:00
|
|
|
import datetime
|
2020-01-15 17:40:32 +01:00
|
|
|
import json
|
|
|
|
import os
|
|
|
|
import re
|
2020-02-06 11:28:30 +01:00
|
|
|
import socket
|
2020-01-15 17:40:32 +01:00
|
|
|
import subprocess
|
2020-02-06 11:28:30 +01:00
|
|
|
import time
|
2020-01-15 17:40:32 +01:00
|
|
|
from typing import List, Optional, Tuple
|
|
|
|
|
|
|
|
from phabricator import Phabricator
|
2020-03-25 07:09:31 +01:00
|
|
|
from git import Repo, BadName, GitCommandError
|
2020-03-23 10:39:49 +01:00
|
|
|
|
|
|
|
|
|
|
|
# FIXME: maybe move to config file

# URL of the upstream LLVM repository.
LLVM_GITHUB_URL = 'ssh://git@github.com/llvm/llvm-project'

# How far back the script searches in the git history to find Revisions
# that have already landed.
APPLIED_SCAN_LIMIT = datetime.timedelta(days=90)
|
|
|
|
|
2020-02-04 14:18:19 +01:00
|
|
|
|
2020-01-15 17:40:32 +01:00
|
|
|
class ApplyPatch:
    """Apply a diff from Phabricator on local working copy.

    This script is a rewrite of `arc patch` to accommodate for dependencies
    that have already landed, but could not be identified by `arc patch`.

    For a given diff_id, this class will get the dependencies listed on Phabricator.
    For each dependency D it will check the diff history:
    - if D has already landed, skip it.
    - If D has not landed, it will download the patch for D and try to apply it locally.
    Once this class has applied all dependencies, it will apply the diff itself.

    This script must be called from the root folder of a local checkout of
    https://github.com/llvm/llvm-project
    """

    def __init__(self, diff_id: int, comment_file_path: str, token: str, url: str, git_hash: str,
                 push_branch: bool = False):
        """Set up the Phabricator client and open the git repo in the current directory.

        Args:
            diff_id: id of the Phabricator diff to apply.
            comment_file_path: file that error messages are appended to, or None.
            token: Conduit API token, or None.
            url: Phabricator URL, or None.
            git_hash: commit to use as base instead of the one resolved from
                Phabricator, or None.
            push_branch: if True, sync master and push the resulting branch to origin.

        Raises:
            ValueError: if no Phabricator URL is available after loading ~/.arcrc.
        """
        self.comment_file_path = comment_file_path
        self.push_branch = push_branch  # type: bool
        self.conduit_token = token  # type: Optional[str]
        self.host = url  # type: Optional[str]
        self._load_arcrc()
        if self.host is None:
            # _load_arcrc() only fills in the host when neither token nor URL
            # was given; fail with a clear message instead of an
            # AttributeError on `None.endswith` below.
            raise ValueError('Phabricator URL is required when a Conduit token is given')
        self.diff_id = diff_id  # type: int
        if not self.host.endswith('/api/'):
            self.host += '/api/'
        self.phab = self._create_phab()
        self.base_revision = git_hash  # type: Optional[str]
        self.msg = []  # type: List[str]
        self.repo = Repo(os.getcwd())  # type: Repo

    @property
    def branch_name(self):
        """Name used for the git branch."""
        return 'phab-diff-{}'.format(self.diff_id)

    def _load_arcrc(self):
        """Load arc configuration from file if not set.

        The file is only read when neither the token nor the URL was given.
        """
        if self.conduit_token is not None or self.host is not None:
            return
        print('Loading configuration from ~/.arcrc file')
        with open(os.path.expanduser('~/.arcrc'), 'r') as arcrc_file:
            arcrc = json.load(arcrc_file)
        # use the first host configured in the file
        self.host = next(iter(arcrc['hosts']))
        self.conduit_token = arcrc['hosts'][self.host]['token']

    def run(self):
        """Try to apply the patch from Phabricator.

        Failures are recorded in `self.msg`, which is written to
        `self.comment_file_path` for showing error messages on Phabricator,
        and are then re-raised.
        """
        try:
            self._refresh_master()
            revision_id, dependencies, base_revision = self._get_dependencies(self.diff_id)
            # Arrange deps in chronological order. A revision reachable via
            # several paths is listed several times; keep only its first
            # (earliest) position so it is not applied twice.
            dependencies = list(dict.fromkeys(reversed(dependencies)))
            self._create_branch(base_revision)
            print('git reset, git cleanup...')
            self.repo.git.reset('--hard')
            self.repo.git.clean('-fdx')
            print('Analyzing {}'.format(diff_to_str(revision_id)))
            if dependencies:
                print('This diff depends on: {}'.format(diff_list_to_str(dependencies)))
                missing, landed = self._get_missing_landed_dependencies(dependencies)
                print(' Already landed: {}'.format(diff_list_to_str(landed)))
                print(' Will be applied: {}'.format(diff_list_to_str(missing)))
                if missing:
                    for revision in missing:
                        self._apply_revision(revision)
                    # FIXME: submit every Revision individually to get nicer history, use original user name
                    self.repo.config_writer().set_value("user", "name", "myusername").release()
                    self.repo.config_writer().set_value("user", "email", "myemail@example.com").release()
                    self.repo.git.commit('-a', '-m', 'dependencies')
                print('All depended diffs are applied')
            self._apply_diff(self.diff_id, revision_id)
            if self.push_branch:
                self._commit_and_push()
            else:
                self.repo.git.add('-u', '.')
            print('done.')
        except Exception as e:
            # Record the failure so that _write_error_message() has something
            # to report; the exception itself still propagates to the caller.
            self.msg.append('{}: {}'.format(type(e).__name__, e))
            raise
        finally:
            self._write_error_message()

    def _refresh_master(self):
        """Update local git repo and origin.

        As origin is disjoint from upstream, it needs to be updated by this script.
        Does nothing unless `push_branch` is set.
        """
        if not self.push_branch:
            return

        print('Syncing local, origin and upstream...')
        self.repo.git.fetch('--all')
        self.repo.git.checkout('master')
        self.repo.git.reset('--hard')
        self.repo.git.clean('-fdx')
        if 'upstream' not in self.repo.remotes:
            self.repo.create_remote('upstream', url=LLVM_GITHUB_URL)
            self.repo.remotes.upstream.fetch()
        self.repo.git.pull('origin', 'master')
        self.repo.git.pull('upstream', 'master')
        try:
            self.repo.git.push('origin', 'master')
            print('refresh of master branch completed')
        except GitCommandError:
            # Best effort: a failed push is reported but does not abort the run.
            print('Info: Could not push to origin master.')

    def _create_branch(self, base_revision: Optional[str]):
        """Create and check out the work branch at the base revision.

        An existing branch of the same name is deleted first. The base
        revision given on the command line takes precedence over the
        `base_revision` argument. If the revision cannot be resolved in the
        local repository, the tip of master is used instead.
        """
        self.repo.git.fetch('--all')
        if self.branch_name in self.repo.heads:
            self.repo.delete_head('--force', self.branch_name)
        if self.base_revision is not None:
            print('Using base revision provided by command line\n{} instead of resolved\n{}'.format(
                self.base_revision, base_revision))
            base_revision = self.base_revision
        try:
            # Resolve the requested revision; without an argument
            # Repo.commit() would silently return the current HEAD.
            commit = self.repo.commit(base_revision)
        except (BadName, ValueError):
            print('Revision {} not found in upstream repository, using master instead.'.format(base_revision))
            # A Head is a reference, not a commit: take the commit it points to.
            commit = self.repo.heads['master'].commit
        new_branch = self.repo.create_head(self.branch_name, commit.hexsha)
        self.repo.head.reference = new_branch
        self.repo.head.reset(index=True, working_tree=True)
        print('Base revision is {}'.format(self.repo.head.commit.hexsha))

    def _commit_and_push(self):
        """Commit the patch and push it to origin.

        Does nothing unless `push_branch` is set.
        """
        if not self.push_branch:
            return

        self.repo.git.add('-A')
        self.repo.index.commit(message='applying Diff {}'.format(
            self.diff_id))
        self.repo.git.push('--force', 'origin', self.branch_name)
        print('Branch {} pushed to origin'.format(self.branch_name))

    def _create_phab(self):
        """Create the Phabricator client and refresh its interface description."""
        phab = Phabricator(token=self.conduit_token, host=self.host)
        try_call(phab.update_interfaces)
        return phab

    def _get_diff(self, diff_id: int):
        """Get a diff from Phabricator based on its diff id."""
        return try_call(lambda: self.phab.differential.getdiff(diff_id=diff_id))

    def _get_revision(self, revision_id: int):
        """Get a revision from Phabricator based on its revision id."""
        return try_call(lambda: self.phab.differential.query(ids=[revision_id])[0])

    def _get_revisions(self, *, phids: Optional[List[str]] = None):
        """Get a list of revisions from Phabricator based on their PH-IDs.

        Raises:
            Exception: if `phids` is None.
        """
        if phids is None:
            raise Exception('_get_revisions phids is None')
        if not phids:
            # Handle an empty query locally. Otherwise the connection
            # will time out.
            return []
        return try_call(lambda: self.phab.differential.query(phids=phids))

    def _get_dependencies(self, diff_id) -> Tuple[int, List[int], str]:
        """Get all dependencies for the diff.

        They are listed in reverse chronological order - from most recent to
        least recent. A revision that is reachable through several paths
        appears once per path.

        Returns:
            Tuple of (revision id of the diff, ids of all revisions it
            transitively depends on, base revision recorded for the diff or
            'master' if none is recorded).
        """
        print('Getting dependencies of {}'.format(diff_id))
        diff = self._get_diff(diff_id)
        revision_id = int(diff.revisionID)
        revision = self._get_revision(revision_id)
        base_revision = diff['sourceControlBaseRevision']
        if not base_revision:
            base_revision = 'master'
        dependency_ids = revision['auxiliary']['phabricator:depends-on']
        revisions = self._get_revisions(phids=dependency_ids)
        result = []
        # Recursively resolve dependencies of those diffs.
        for r in revisions:
            _, sub, _ = self._get_dependencies(r['diffs'][0])
            result.append(r['id'])
            result.extend(sub)

        return revision_id, result, base_revision

    def _apply_diff(self, diff_id: int, revision_id: int):
        """Download and apply a diff to the local working copy.

        Raises:
            Exception: if `git apply` exits with a non-zero status; the
                message contains its stdout and stderr.
        """
        print('Applying diff {} for revision {}...'.format(diff_id, diff_to_str(revision_id)))
        # TODO: print diff or URL to it
        diff = try_call(lambda: self.phab.differential.getrawdiff(diffID=str(diff_id)).response)
        # Argument list instead of a shell string: no shell is needed to
        # feed the patch to `git apply` on stdin.
        proc = subprocess.run(['git', 'apply', '-'], input=diff, text=True,
                              stdout=subprocess.PIPE, stderr=subprocess.PIPE)
        if proc.returncode != 0:
            raise Exception('Applying patch failed:\n{}'.format(proc.stdout + proc.stderr))

    def _apply_revision(self, revision_id: int):
        """Download and apply the latest diff of a revision to the local working copy."""
        revision = self._get_revision(revision_id)
        # Take the diff_id with the highest number, this should be latest one.
        # Compare numerically: the ids may arrive as strings, for which a
        # plain max() would compare lexicographically ('9999' > '12345').
        diff_id = max(revision['diffs'], key=int)
        self._apply_diff(diff_id, revision_id)

    def _write_error_message(self):
        """Append the collected messages to the comment file, if any.

        Nothing is written when no comment file was configured or when
        there are no messages.
        """
        if self.comment_file_path is None:
            return

        if not self.msg:
            return
        print('writing error message to {}'.format(self.comment_file_path))
        with open(self.comment_file_path, 'a') as comment_file:
            text = '\n\n'.join(self.msg)
            comment_file.write(text)

    def _get_landed_revisions(self):
        """Yield the revisions (e.g. 'D123') found in recent commit messages.

        Walks the history of the command-line base revision (or master if
        none was given) and stops at the first commit older than
        APPLIED_SCAN_LIMIT.
        """
        diff_regex = re.compile(r'^Differential Revision: https://reviews\.llvm\.org/(.*)$', re.MULTILINE)
        earliest_commit = None
        rev = self.base_revision
        age_limit = datetime.datetime.now() - APPLIED_SCAN_LIMIT
        if rev is None:
            rev = 'master'
        for commit in self.repo.iter_commits(rev):
            if datetime.datetime.fromtimestamp(commit.committed_date) < age_limit:
                break
            earliest_commit = commit
            result = diff_regex.search(commit.message)
            if result is not None:
                yield result.group(1)
        if earliest_commit is not None:
            print('Earliest analyzed commit in history', earliest_commit.hexsha, earliest_commit.committed_datetime)

    def _get_missing_landed_dependencies(self, dependencies: List[int]) -> Tuple[List[int], List[int]]:
        """Check which of the dependencies have already landed on the current branch.

        Returns:
            Tuple of (missing dependencies, landed dependencies), each in the
            order given in `dependencies`.
        """
        # Scan the git history once instead of once per dependency.
        landed_revisions = set(self._get_landed_revisions())
        landed_deps = []
        missing_deps = []
        for dependency in dependencies:
            if diff_to_str(dependency) in landed_revisions:
                landed_deps.append(dependency)
            else:
                missing_deps.append(dependency)
        return missing_deps, landed_deps
|
|
|
|
|
|
|
|
|
|
|
|
def diff_to_str(diff: int) -> str:
    """Return the id prefixed with "D", e.g. 123 -> "D123"."""
    return f'D{diff}'
|
|
|
|
|
|
|
|
|
|
|
|
def diff_list_to_str(diffs: List[int]) -> str:
    """Render diff ids as a comma separated string, each one prefixed with "D"."""
    labels = map(diff_to_str, diffs)
    return ', '.join(labels)
|
|
|
|
|
|
|
|
|
2020-02-06 11:28:30 +01:00
|
|
|
def try_call(call, max_retries: int = 5, backoff_seconds: float = 10):
    """Call `call()` and return its result, retrying on socket.timeout.

    After the k-th consecutive timeout the function sleeps for
    `k * backoff_seconds` seconds before trying again. Exceptions other than
    socket.timeout are not caught.

    Args:
        call: callable taking no arguments.
        max_retries: number of retries after the first failed attempt.
        backoff_seconds: base delay; multiplied by the number of failures so far.

    Returns:
        Whatever `call()` returns.

    Raises:
        socket.timeout: if the call still times out after `max_retries` retries.
    """
    failures = 0
    while True:
        try:
            return call()
        except socket.timeout as e:
            failures += 1
            if failures > max_retries:
                print('Connection to Phabricator failed, giving up: {}'.format(e))
                raise
            print('Connection to Phabricator failed, retrying: {}'.format(e))
            time.sleep(failures * backoff_seconds)
|
|
|
|
|
|
|
|
|
2020-01-15 17:40:32 +01:00
|
|
|
if __name__ == "__main__":
    # Command line entry point: parse the options, then apply the requested diff.
    cli = argparse.ArgumentParser(description='Apply Phabricator patch to working directory.')
    cli.add_argument('diff_id', type=int)
    # TODO: instead of --comment-file use stdout / stderr.
    cli.add_argument('--comment-file', type=str, dest='comment_file_path', default=None)
    cli.add_argument('--token', type=str, default=None, help='Conduit API token')
    cli.add_argument('--url', type=str, default=None, help='Phabricator URL')
    cli.add_argument('--commit', dest='commit', type=str, default=None,
                     help='Use this commit as a base. By default tool tries to pick the base commit itself')
    cli.add_argument('--push-branch', action='store_true', dest='push_branch',
                     help='choose if branch shall be pushed to origin')
    options = cli.parse_args()

    ApplyPatch(
        diff_id=options.diff_id,
        comment_file_path=options.comment_file_path,
        token=options.token,
        url=options.url,
        git_hash=options.commit,
        push_branch=options.push_branch,
    ).run()
|