summaryrefslogtreecommitdiffstats
path: root/testing/web-platform/update/upstream.py
diff options
context:
space:
mode:
Diffstat (limited to 'testing/web-platform/update/upstream.py')
-rw-r--r--testing/web-platform/update/upstream.py475
1 files changed, 475 insertions, 0 deletions
diff --git a/testing/web-platform/update/upstream.py b/testing/web-platform/update/upstream.py
new file mode 100644
index 0000000000..21efc72a13
--- /dev/null
+++ b/testing/web-platform/update/upstream.py
@@ -0,0 +1,475 @@
+# This Source Code Form is subject to the terms of the Mozilla Public
+# License, v. 2.0. If a copy of the MPL was not distributed with this
+# file, You can obtain one at http://mozilla.org/MPL/2.0/.
+
+import os
+import re
+import subprocess
+import sys
+import tempfile
+
+from six.moves import input
+from six.moves.urllib import parse as urlparse
+from wptrunner.update.base import Step, StepRunner, exit_clean, exit_unclean
+from wptrunner.update.tree import get_unique_name
+
+from .github import GitHub
+from .tree import Commit, GitTree, Patch
+
+
+def rewrite_patch(patch, strip_dir):
+ """Take a Patch and convert to a different repository by stripping a prefix from the
+ file paths. Also rewrite the message to remove the bug number and reviewer, but add
+ a bugzilla link in the summary.
+
+ :param patch: the Patch to convert
+ :param strip_dir: the path prefix to remove
+ """
+
+ if not strip_dir.startswith("/"):
+ strip_dir = "/%s" % strip_dir
+
+ new_diff = []
+ line_starts = [
+ ("diff ", True),
+ ("+++ ", True),
+ ("--- ", True),
+ ("rename from ", False),
+ ("rename to ", False),
+ ]
+ for line in patch.diff.split("\n"):
+ for start, leading_slash in line_starts:
+ strip = strip_dir if leading_slash else strip_dir[1:]
+ if line.startswith(start):
+ new_diff.append(line.replace(strip, "").encode("utf8"))
+ break
+ else:
+ new_diff.append(line)
+
+ new_diff = "\n".join(new_diff)
+
+ assert new_diff != patch
+
+ return Patch(patch.author, patch.email, rewrite_message(patch), new_diff)
+
+
+def rewrite_message(patch):
+ if patch.message.bug is not None:
+ return "\n".join(
+ [
+ patch.message.summary,
+ patch.message.body,
+ "",
+ "Upstreamed from https://bugzilla.mozilla.org/show_bug.cgi?id=%s [ci skip]"
+ % patch.message.bug, # noqa E501
+ ]
+ )
+
+ return "\n".join(
+ [patch.message.full_summary, "%s\n[ci skip]\n" % patch.message.body]
+ )
+
+
+class SyncToUpstream(Step):
+ """Sync local changes to upstream"""
+
+ def create(self, state):
+ if not state.kwargs["upstream"]:
+ return
+
+ if not isinstance(state.local_tree, GitTree):
+ self.logger.error("Cannot sync with upstream from a non-Git checkout.")
+ return exit_clean
+
+ try:
+ import requests # noqa F401
+ except ImportError:
+ self.logger.error(
+ "Upstream sync requires the requests module to be installed"
+ )
+ return exit_clean
+
+ if not state.sync_tree:
+ os.makedirs(state.sync["path"])
+ state.sync_tree = GitTree(root=state.sync["path"])
+
+ kwargs = state.kwargs
+ with state.push(
+ ["local_tree", "sync_tree", "tests_path", "metadata_path", "sync"]
+ ):
+ state.token = kwargs["token"]
+ runner = SyncToUpstreamRunner(self.logger, state)
+ runner.run()
+
+
+class GetLastSyncData(Step):
+ """Find the gecko commit at which we last performed a sync with upstream and the upstream
+ commit that was synced."""
+
+ provides = ["sync_data_path", "last_sync_commit", "old_upstream_rev"]
+
+ def create(self, state):
+ self.logger.info("Looking for last sync commit")
+ state.sync_data_path = os.path.join(state.metadata_path, "mozilla-sync")
+ items = {}
+ with open(state.sync_data_path) as f:
+ for line in f.readlines():
+ key, value = [item.strip() for item in line.split(":", 1)]
+ items[key] = value
+
+ state.last_sync_commit = Commit(
+ state.local_tree, state.local_tree.rev_from_hg(items["local"])
+ )
+ state.old_upstream_rev = items["upstream"]
+
+ if not state.local_tree.contains_commit(state.last_sync_commit):
+ self.logger.error(
+ "Could not find last sync commit %s" % state.last_sync_commit.sha1
+ )
+ return exit_clean
+
+ self.logger.info(
+ "Last sync to web-platform-tests happened in %s"
+ % state.last_sync_commit.sha1
+ )
+
+
+class CheckoutBranch(Step):
+ """Create a branch in the sync tree pointing at the last upstream sync commit
+ and check it out"""
+
+ provides = ["branch"]
+
+ def create(self, state):
+ self.logger.info("Updating sync tree from %s" % state.sync["remote_url"])
+ state.branch = state.sync_tree.unique_branch_name(
+ "outbound_update_%s" % state.old_upstream_rev
+ )
+ state.sync_tree.update(
+ state.sync["remote_url"], state.sync["branch"], state.branch
+ )
+ state.sync_tree.checkout(state.old_upstream_rev, state.branch, force=True)
+
+
+class GetBaseCommit(Step):
+ """Find the latest upstream commit on the branch that we are syncing with"""
+
+ provides = ["base_commit"]
+
+ def create(self, state):
+ state.base_commit = state.sync_tree.get_remote_sha1(
+ state.sync["remote_url"], state.sync["branch"]
+ )
+ self.logger.debug("New base commit is %s" % state.base_commit.sha1)
+
+
+class LoadCommits(Step):
+ """Get a list of commits in the gecko tree that need to be upstreamed"""
+
+ provides = ["source_commits", "has_backouts"]
+
+ def create(self, state):
+ state.source_commits = state.local_tree.log(
+ state.last_sync_commit, state.tests_path
+ )
+
+ update_regexp = re.compile(
+ "Bug \d+ - Update web-platform-tests to revision [0-9a-f]{40}"
+ )
+
+ state.has_backouts = False
+
+ for i, commit in enumerate(state.source_commits[:]):
+ if update_regexp.match(commit.message.text):
+ # This is a previous update commit so ignore it
+ state.source_commits.remove(commit)
+ continue
+
+ elif commit.message.backouts:
+ # TODO: Add support for collapsing backouts
+ state.has_backouts = True
+
+ elif not commit.message.bug:
+ self.logger.error(
+ "Commit %i (%s) doesn't have an associated bug number."
+ % (i + 1, commit.sha1)
+ )
+ return exit_unclean
+
+ self.logger.debug("Source commits: %s" % state.source_commits)
+
+
+class SelectCommits(Step):
+ """Provide a UI to select which commits to upstream"""
+
+ def create(self, state):
+ while True:
+ commits = state.source_commits[:]
+ for i, commit in enumerate(commits):
+ print("{}:\t{}".format(i, commit.message.summary))
+
+ remove = input(
+ "Provide a space-separated list of any commits numbers "
+ "to remove from the list to upstream:\n"
+ ).strip()
+ remove_idx = set()
+ for item in remove.split(" "):
+ try:
+ item = int(item)
+ except ValueError:
+ continue
+ if item < 0 or item >= len(commits):
+ continue
+ remove_idx.add(item)
+
+ keep_commits = [
+ (i, cmt) for i, cmt in enumerate(commits) if i not in remove_idx
+ ]
+ # TODO: consider printed removed commits
+ print("Selected the following commits to keep:")
+ for i, commit in keep_commits:
+ print("{}:\t{}".format(i, commit.message.summary))
+ confirm = input("Keep the above commits? y/n\n").strip().lower()
+
+ if confirm == "y":
+ state.source_commits = [item[1] for item in keep_commits]
+ break
+
+
+class MovePatches(Step):
+ """Convert gecko commits into patches against upstream and commit these to the sync tree."""
+
+ provides = ["commits_loaded"]
+
+ def create(self, state):
+ if not hasattr(state, "commits_loaded"):
+ state.commits_loaded = 0
+
+ strip_path = os.path.relpath(state.tests_path, state.local_tree.root)
+ self.logger.debug("Stripping patch %s" % strip_path)
+
+ if not hasattr(state, "patch"):
+ state.patch = None
+
+ for commit in state.source_commits[state.commits_loaded :]:
+ i = state.commits_loaded + 1
+ self.logger.info("Moving commit %i: %s" % (i, commit.message.full_summary))
+ stripped_patch = None
+ if state.patch:
+ filename, stripped_patch = state.patch
+ if not os.path.exists(filename):
+ stripped_patch = None
+ else:
+ with open(filename) as f:
+ stripped_patch.diff = f.read()
+ state.patch = None
+ if not stripped_patch:
+ patch = commit.export_patch(state.tests_path)
+ stripped_patch = rewrite_patch(patch, strip_path)
+ if not stripped_patch.diff:
+ self.logger.info("Skipping empty patch")
+ state.commits_loaded = i
+ continue
+ try:
+ state.sync_tree.import_patch(stripped_patch)
+ except Exception:
+ with tempfile.NamedTemporaryFile(delete=False, suffix=".diff") as f:
+ f.write(stripped_patch.diff)
+ print(
+ """Patch failed to apply. Diff saved in {}
+Fix this file so it applies and run with --continue""".format(
+ f.name
+ )
+ )
+ state.patch = (f.name, stripped_patch)
+ print(state.patch)
+ sys.exit(1)
+ state.commits_loaded = i
+ input("Check for differences with upstream")
+
+
+class RebaseCommits(Step):
+ """Rebase commits from the current branch on top of the upstream destination branch.
+
+ This step is particularly likely to fail if the rebase generates merge conflicts.
+ In that case the conflicts can be fixed up locally and the sync process restarted
+ with --continue.
+ """
+
+ def create(self, state):
+ self.logger.info("Rebasing local commits")
+ continue_rebase = False
+ # Check if there's a rebase in progress
+ if os.path.exists(
+ os.path.join(state.sync_tree.root, ".git", "rebase-merge")
+ ) or os.path.exists(os.path.join(state.sync_tree.root, ".git", "rebase-apply")):
+ continue_rebase = True
+
+ try:
+ state.sync_tree.rebase(state.base_commit, continue_rebase=continue_rebase)
+ except subprocess.CalledProcessError:
+ self.logger.info(
+ "Rebase failed, fix merge and run %s again with --continue"
+ % sys.argv[0]
+ )
+ raise
+ self.logger.info("Rebase successful")
+
+
+class CheckRebase(Step):
+ """Check if there are any commits remaining after rebase"""
+
+ provides = ["rebased_commits"]
+
+ def create(self, state):
+ state.rebased_commits = state.sync_tree.log(state.base_commit)
+ if not state.rebased_commits:
+ self.logger.info("Nothing to upstream, exiting")
+ return exit_clean
+
+
+class MergeUpstream(Step):
+ """Run steps to push local commits as seperate PRs and merge upstream."""
+
+ provides = ["merge_index", "gh_repo"]
+
+ def create(self, state):
+ gh = GitHub(state.token)
+ if "merge_index" not in state:
+ state.merge_index = 0
+
+ org, name = urlparse.urlsplit(state.sync["remote_url"]).path[1:].split("/")
+ if name.endswith(".git"):
+ name = name[:-4]
+ state.gh_repo = gh.repo(org, name)
+ for commit in state.rebased_commits[state.merge_index :]:
+ with state.push(["gh_repo", "sync_tree"]):
+ state.commit = commit
+ pr_merger = PRMergeRunner(self.logger, state)
+ rv = pr_merger.run()
+ if rv is not None:
+ return rv
+ state.merge_index += 1
+
+
+class UpdateLastSyncData(Step):
+ """Update the gecko commit at which we last performed a sync with upstream."""
+
+ provides = []
+
+ def create(self, state):
+ self.logger.info("Updating last sync commit")
+ data = {
+ "local": state.local_tree.rev_to_hg(state.local_tree.rev),
+ "upstream": state.sync_tree.rev,
+ }
+ with open(state.sync_data_path, "w") as f:
+ for key, value in data.iteritems():
+ f.write("%s: %s\n" % (key, value))
+ # This gets added to the patch later on
+
+
+class MergeLocalBranch(Step):
+ """Create a local branch pointing at the commit to upstream"""
+
+ provides = ["local_branch"]
+
+ def create(self, state):
+ branch_prefix = "sync_%s" % state.commit.sha1
+ local_branch = state.sync_tree.unique_branch_name(branch_prefix)
+
+ state.sync_tree.create_branch(local_branch, state.commit)
+ state.local_branch = local_branch
+
+
+class MergeRemoteBranch(Step):
+ """Get an unused remote branch name to use for the PR"""
+
+ provides = ["remote_branch"]
+
+ def create(self, state):
+ remote_branch = "sync_%s" % state.commit.sha1
+ branches = [
+ ref[len("refs/heads/") :]
+ for sha1, ref in state.sync_tree.list_remote(state.gh_repo.url)
+ if ref.startswith("refs/heads")
+ ]
+ state.remote_branch = get_unique_name(branches, remote_branch)
+
+
+class PushUpstream(Step):
+ """Push local branch to remote"""
+
+ def create(self, state):
+ self.logger.info("Pushing commit upstream")
+ state.sync_tree.push(state.gh_repo.url, state.local_branch, state.remote_branch)
+
+
+class CreatePR(Step):
+ """Create a PR for the remote branch"""
+
+ provides = ["pr"]
+
+ def create(self, state):
+ self.logger.info("Creating a PR")
+ commit = state.commit
+ state.pr = state.gh_repo.create_pr(
+ commit.message.full_summary,
+ state.remote_branch,
+ "master",
+ commit.message.body if commit.message.body else "",
+ )
+
+
+class PRAddComment(Step):
+ """Add an issue comment indicating that the code has been reviewed already"""
+
+ def create(self, state):
+ state.pr.issue.add_comment("Code reviewed upstream.")
+
+
+class MergePR(Step):
+ """Merge the PR"""
+
+ def create(self, state):
+ self.logger.info("Merging PR")
+ state.pr.merge()
+
+
+class PRDeleteBranch(Step):
+ """Delete the remote branch"""
+
+ def create(self, state):
+ self.logger.info("Deleting remote branch")
+ state.sync_tree.push(state.gh_repo.url, "", state.remote_branch)
+
+
+class SyncToUpstreamRunner(StepRunner):
+ """Runner for syncing local changes to upstream"""
+
+ steps = [
+ GetLastSyncData,
+ CheckoutBranch,
+ GetBaseCommit,
+ LoadCommits,
+ SelectCommits,
+ MovePatches,
+ RebaseCommits,
+ CheckRebase,
+ MergeUpstream,
+ UpdateLastSyncData,
+ ]
+
+
+class PRMergeRunner(StepRunner):
+ """(Sub)Runner for creating and merging a PR"""
+
+ steps = [
+ MergeLocalBranch,
+ MergeRemoteBranch,
+ PushUpstream,
+ CreatePR,
+ PRAddComment,
+ MergePR,
+ PRDeleteBranch,
+ ]