Skip to content

Commit 6f599e7

Browse files
committed
git: Use merge-tree in patchsets
Previously patchsets used a hacky invocation of update-index to overlay changed files from old tree to new tree. In addition to being slower than necessary, this has the downside of showing upstream changes in the diff, even those that were not changed in the given review upload. Using git merge-tree for this instead is cleaner, faster, and better. We do this by "cherry-picking" the old branch with git merge-tree, but providing -X ours as the strategy. This provides a tree that looks like the new base with the old changes applied. For cases where the old changes don't apply cleanly, the ours strategy prevents conflicts by taking the version in the old tree. Although this can be a bit confusing when looking at the file as a whole, it provides a succinct way to view a difference between the old version and new version. Topic: mergetreepatch
1 parent 740c5cd commit 6f599e7

File tree

1 file changed

+29
-55
lines changed

1 file changed

+29
-55
lines changed

revup/git.py

+29-55
Original file line numberDiff line numberDiff line change
@@ -614,19 +614,28 @@ async def get_diff_summary(
614614

615615
async def merge_tree_commit(
616616
self,
617-
branch1: GitCommitHash,
618-
branch2: GitCommitHash,
617+
tree1: GitCommitHash,
618+
tree2: GitCommitHash,
619619
new_commit_info: CommitHeader,
620-
merge_base: Optional[GitCommitHash] = None,
620+
merge_base: GitCommitHash,
621+
strategy: Optional[str] = None,
621622
) -> GitCommitHash:
622623
"""
623624
Perform a combined git merge-tree and commit-tree, returning a git commit hash. Raises
624625
GitConflictException if there are conflicts while merging the trees.
625626
"""
626-
args = ["merge-tree", "--write-tree", "--messages", "-z"]
627-
if merge_base:
628-
args.extend(["--merge-base", merge_base])
629-
args.extend([branch1, branch2])
627+
args = [
628+
"merge-tree",
629+
"--write-tree",
630+
"--messages",
631+
"-z",
632+
"--merge-base",
633+
merge_base,
634+
tree1,
635+
tree2,
636+
]
637+
if strategy is not None:
638+
args.extend(["-X", strategy])
630639

631640
ret, stdout = await self.git(*args, raiseonerror=False)
632641

@@ -749,58 +758,23 @@ async def make_virtual_diff_target(
749758
) -> GitCommitHash:
750759
"""
751760
Return a commit (optionally on top of parent) that provides a way to get the diff from old
752-
head to new head while accounting for the fact that new base might have been rebased since
753-
old base. This new commit makes an effort to include only files that were actually changed,
754-
while excluding files that were changed upstream as part of the rebase.
755-
756-
We do this by resetting any files that changed in the old_base->old_head diff to their
757-
old_head versions in new_base. The returned tree will thus have the following properties
758-
when diffed against new_head.
759-
760-
For files not touched by old or new, ret->new_head won't show any diff. This is primarily
761-
what allows us to exclude upstream files.
762-
For files touched by both old and new, ret->new_head will show the entire old_head->new_head
763-
diff. This will include upstream changes for these files, which are difficult to untangle.
764-
For files not touched in old but touched by new (regardless of whether it existed in
765-
old_base), diff will show new_base->new_head.
766-
For files touched in old but not touched in new, there are 2 cases. If file exists in
767-
new_base, diff will show old_head->new_base. If file doesn't exist in new_base, diff will
768-
show old_head->(deleted) which isn't perfect since technically new_base->new_head did not
769-
delete the file, but probably the least confusing of the alternatives of showing no diff and
770-
showing the old_head->old_base diff.
771-
"""
772-
new_index: List[str] = []
773-
774-
# Transform diff-tree raw output to ls-files style output, taking only the new version
775-
for m in RE_RAW_DIFF_TREE_LINE.finditer(
776-
await self.git_stdout("diff-tree", "-r", "--no-commit-id", "--raw", old_base, old_head)
777-
):
778-
new_index.append(f"{m.group('new_mode')} {m.group('new_hash')} 0\t{m.group('path')}")
779-
780-
if not new_index:
781-
# No files were actually changed, so no diff needs to be applied to new_base
782-
return new_base
783-
784-
temp_index_path = self.get_scratch_dir() + "/index.temp"
785-
git_env = {
786-
"GIT_INDEX_FILE": temp_index_path,
787-
}
788-
shutil.copy(f"{self.git_dir}/index", temp_index_path)
789-
await self.git("reset", "-q", "--no-refresh", new_base, "--", ":/", env=git_env)
790-
await self.git(
791-
"update-index",
792-
"--index-info",
793-
input_str="\n".join(new_index),
794-
env=git_env,
795-
)
761+
head to new head while accounting for the fact that the base might have been rebased
796762
797-
tree = GitTreeHash(await self.git_stdout("write-tree", env=git_env))
798-
new_commit_info = CommitHeader(tree, [parent] if parent else [])
763+
We do this by "cherry-picking" the old branch with git merge-tree, but providing -X ours as
764+
the strategy. This provides a tree that looks like the new base with the old changes applied.
765+
For cases where the old changes don't apply cleanly, the ours strategy prevents conflicts by
766+
taking the version in the old tree. Although this can be a bit confusing when looking at the
767+
file as a whole, it provides a succinct way to view a difference between the old version and
768+
new version.
769+
"""
770+
new_commit_info = CommitHeader(GitTreeHash(""), [parent] if parent else [])
799771
new_commit_info.commit_msg = (
800-
f"revup virtual diff target\n\n{old_base}\n{old_head}\n{new_base}\n{new_head}"
772+
f"revup virtual diff target\n\n{old_base}\n{old_head}\n{new_base}\n{new_head}\n\n"
773+
"revup uses this branch internally to generate github viewable diffs. The commits and "
774+
"diffs between commits are not meaningful or useful."
801775
)
802776

803-
return await self.commit_tree(new_commit_info)
777+
return await self.merge_tree_commit(old_head, new_base, new_commit_info, old_base, "ours")
804778

805779
async def soft_reset(self, new_commit: GitCommitHash, env: Dict) -> None:
806780
await self.git("reset", "--soft", new_commit, env=env)

0 commit comments

Comments
 (0)