tagmerge.py
265 lines
| 11.2 KiB
| text/x-python
|
PythonLexer
/ mercurial / tagmerge.py
Angel Ezquerra
|
r21922 | # tagmerge.py - merge .hgtags files | ||
# | ||||
# Copyright 2014 Angel Ezquerra <angel.ezquerra@gmail.com> | ||||
# | ||||
# This software may be used and distributed according to the terms of the | ||||
# GNU General Public License version 2 or any later version. | ||||
# This module implements an automatic merge algorithm for mercurial's tag files | ||||
# | ||||
# The tagmerge algorithm implemented in this module is able to resolve most | ||||
# merge conflicts that currently would trigger a .hgtags merge conflict. The | ||||
# only case that it does not (and cannot) handle is that in which two tags point | ||||
# to different revisions on each merge parent _and_ their corresponding tag | ||||
# histories have the same rank (i.e. the same length). In all other cases the | ||||
# merge algorithm will choose the revision belonging to the parent with the | ||||
# highest ranked tag history. The merged tag history is the combination of both | ||||
# tag histories (special care is taken to try to combine common tag histories | ||||
# where possible). | ||||
# | ||||
# In addition to actually merging the tags from two parents, taking into | ||||
# account the base, the algorithm also tries to minimize the difference | ||||
# between the merged tag file and the first parent's tag file (i.e. it tries to | ||||
# make the merged tag order as as similar as possible to the first parent's tag | ||||
# file order). | ||||
# | ||||
# The algorithm works as follows: | ||||
# 1. read the tags from p1, p2 and the base | ||||
# - when reading the p1 tags, also get the line numbers associated to each | ||||
# tag node (these will be used to sort the merged tags in a way that | ||||
# minimizes the diff to p1). Ignore the file numbers when reading p2 and | ||||
# the base | ||||
# 2. recover the "lost tags" (i.e. those that are found in the base but not on | ||||
# p1 or p2) and add them back to p1 and/or p2 | ||||
# - at this point the only tags that are on p1 but not on p2 are those new | ||||
# tags that were introduced in p1. Same thing for the tags that are on p2 | ||||
# but not on p2 | ||||
# 3. take all tags that are only on p1 or only on p2 (but not on the base) | ||||
# - Note that these are the tags that were introduced between base and p1 | ||||
# and between base and p2, possibly on separate clones | ||||
# 4. for each tag found both on p1 and p2 perform the following merge algorithm: | ||||
# - the tags conflict if their tag "histories" have the same "rank" (i.e. | ||||
# length) _AND_ the last (current) tag is _NOT_ the same | ||||
# - for non conflicting tags: | ||||
# - choose which are the high and the low ranking nodes | ||||
# - the high ranking list of nodes is the one that is longer. | ||||
# In case of draw favor p1 | ||||
# - the merged node list is made of 3 parts: | ||||
# - first the nodes that are common to the beginning of both | ||||
# the low and the high ranking nodes | ||||
# - second the non common low ranking nodes | ||||
# - finally the non common high ranking nodes (with the last | ||||
# one being the merged tag node) | ||||
# - note that this is equivalent to putting the whole low ranking | ||||
# node list first, followed by the non common high ranking nodes | ||||
# - note that during the merge we keep the "node line numbers", which will | ||||
# be used when writing the merged tags to the tag file | ||||
# 5. write the merged tags taking into account to their positions in the first | ||||
# parent (i.e. try to keep the relative ordering of the nodes that come | ||||
# from p1). This minimizes the diff between the merged and the p1 tag files | ||||
# This is donw by using the following algorithm | ||||
# - group the nodes for a given tag that must be written next to each other | ||||
# - A: nodes that come from consecutive lines on p1 | ||||
# - B: nodes that come from p2 (i.e. whose associated line number is | ||||
# None) and are next to one of the a nodes in A | ||||
# - each group is associated with a line number coming from p1 | ||||
# - generate a "tag block" for each of the groups | ||||
# - a tag block is a set of consecutive "node tag" lines belonging to | ||||
# the same tag and which will be written next to each other on the | ||||
# merged tags file | ||||
# - sort the "tag blocks" according to their associated number line | ||||
# - put blocks whose nodes come all from p2 first | ||||
# - write the tag blocks in the sorted order | ||||
import tags | ||||
import util | ||||
from node import nullid, hex | ||||
from i18n import _ | ||||
import operator | ||||
hexnullid = hex(nullid) | ||||
def readtagsformerge(ui, repo, lines, fn='', keeplinenums=False): | ||||
'''read the .hgtags file into a structure that is suitable for merging | ||||
Sepending on the keeplinenumbers flag, clear the line numbers associated | ||||
with each tag. Rhis is done because only the line numbers of the first | ||||
parent are useful for merging | ||||
''' | ||||
filetags = tags._readtaghist(ui, repo, lines, fn=fn, recode=None, | ||||
calcnodelines=True)[1] | ||||
for tagname, taginfo in filetags.items(): | ||||
if not keeplinenums: | ||||
for el in taginfo: | ||||
el[1] = None | ||||
return filetags | ||||
def grouptagnodesbyline(tagnodes): | ||||
''' | ||||
Group nearby nodes (i.e. those that must be written next to each other) | ||||
The input is a list of [node, position] pairs, corresponding to a given tag | ||||
The position is the line number where the node was found on the first parent | ||||
.hgtags file, or None for those nodes that came from the base or the second | ||||
parent .hgtags files. | ||||
This function groups those [node, position] pairs, returning a list of | ||||
groups of nodes that must be written next to each other because their | ||||
positions are consecutive or have no position preference (because their | ||||
position is None). | ||||
The result is a list of [position, [consecutive node list]] | ||||
''' | ||||
firstlinenum = None | ||||
for hexnode, linenum in tagnodes: | ||||
firstlinenum = linenum | ||||
if firstlinenum is not None: | ||||
break | ||||
if firstlinenum is None: | ||||
return [[None, [el[0] for el in tagnodes]]] | ||||
tagnodes[0][1] = firstlinenum | ||||
groupednodes = [[firstlinenum, []]] | ||||
prevlinenum = firstlinenum | ||||
for hexnode, linenum in tagnodes: | ||||
if linenum is not None and linenum - prevlinenum > 1: | ||||
groupednodes.append([linenum, []]) | ||||
groupednodes[-1][1].append(hexnode) | ||||
if linenum is not None: | ||||
prevlinenum = linenum | ||||
return groupednodes | ||||
def writemergedtags(repo, mergedtags): | ||||
''' | ||||
write the merged tags while trying to minimize the diff to the first parent | ||||
This function uses the ordering info stored on the merged tags dict to | ||||
generate an .hgtags file which is correct (in the sense that its contents | ||||
correspond to the result of the tag merge) while also being as close as | ||||
possible to the first parent's .hgtags file. | ||||
''' | ||||
# group the node-tag pairs that must be written next to each other | ||||
for tname, taglist in mergedtags.items(): | ||||
mergedtags[tname] = grouptagnodesbyline(taglist) | ||||
# convert the grouped merged tags dict into a format that resembles the | ||||
# final .hgtags file (i.e. a list of blocks of 'node tag' pairs) | ||||
def taglist2string(tlist, tname): | ||||
return '\n'.join(['%s %s' % (hexnode, tname) for hexnode in tlist]) | ||||
finaltags = [] | ||||
for tname, tags in mergedtags.items(): | ||||
for block in tags: | ||||
block[1] = taglist2string(block[1], tname) | ||||
finaltags += tags | ||||
# the tag groups are linked to a "position" that can be used to sort them | ||||
# before writing them | ||||
# the position is calculated to ensure that the diff of the merged .hgtags | ||||
# file to the first parent's .hgtags file is as small as possible | ||||
finaltags.sort(key=operator.itemgetter(0)) | ||||
# finally we can join the sorted groups to get the final contents of the | ||||
# merged .hgtags file, and then write it to disk | ||||
mergedtagstring = '\n'.join([tags for rank, tags in finaltags if tags]) | ||||
fp = repo.wfile('.hgtags', 'wb') | ||||
fp.write(mergedtagstring + '\n') | ||||
fp.close() | ||||
def singletagmerge(p1nodes, p2nodes): | ||||
''' | ||||
merge the nodes corresponding to a single tag | ||||
Note that the inputs are lists of node-linenum pairs (i.e. not just lists | ||||
of nodes) | ||||
''' | ||||
if not p2nodes: | ||||
return p1nodes | ||||
if not p1nodes: | ||||
return p2nodes | ||||
# there is no conflict unless both tags point to different revisions | ||||
# and have a non identical tag history | ||||
p1currentnode = p1nodes[-1][0] | ||||
p2currentnode = p2nodes[-1][0] | ||||
if p1currentnode != p2currentnode and len(p1nodes) == len(p2nodes): | ||||
# cannot merge two tags with same rank pointing to different nodes | ||||
return None | ||||
# which are the highest ranking (hr) / lowest ranking (lr) nodes? | ||||
if len(p1nodes) >= len(p2nodes): | ||||
hrnodes, lrnodes = p1nodes, p2nodes | ||||
else: | ||||
hrnodes, lrnodes = p2nodes, p1nodes | ||||
# the lowest ranking nodes will be written first, followed by the highest | ||||
# ranking nodes | ||||
# to avoid unwanted tag rank explosion we try to see if there are some | ||||
# common nodes that can be written only once | ||||
commonidx = len(lrnodes) | ||||
for n in range(len(lrnodes)): | ||||
if hrnodes[n][0] != lrnodes[n][0]: | ||||
commonidx = n | ||||
break | ||||
lrnodes[n][1] = p1nodes[n][1] | ||||
# the merged node list has 3 parts: | ||||
# - common nodes | ||||
# - non common lowest ranking nodes | ||||
# - non common highest ranking nodes | ||||
# note that the common nodes plus the non common lowest ranking nodes is the | ||||
# whole list of lr nodes | ||||
return lrnodes + hrnodes[commonidx:] | ||||
def merge(repo, fcd, fco, fca): | ||||
''' | ||||
Merge the tags of two revisions, taking into account the base tags | ||||
Try to minimize the diff between the merged tags and the first parent tags | ||||
''' | ||||
ui = repo.ui | ||||
# read the p1, p2 and base tags | ||||
# only keep the line numbers for the p1 tags | ||||
p1tags = readtagsformerge( | ||||
ui, repo, fcd.data().splitlines(), fn="p1 tags", | ||||
keeplinenums=True) | ||||
p2tags = readtagsformerge( | ||||
ui, repo, fco.data().splitlines(), fn="p2 tags", | ||||
keeplinenums=False) | ||||
basetags = readtagsformerge( | ||||
ui, repo, fca.data().splitlines(), fn="base tags", | ||||
keeplinenums=False) | ||||
# recover the list of "lost tags" (i.e. those that were found on the base | ||||
# revision but not on one of the revisions being merged) | ||||
basetagset = set(basetags) | ||||
for n, pntags in enumerate((p1tags, p2tags)): | ||||
pntagset = set(pntags) | ||||
pnlosttagset = basetagset - pntagset | ||||
for t in pnlosttagset: | ||||
pntags[t] = basetags[t] | ||||
if pntags[t][-1][0] != hexnullid: | ||||
pntags[t].append([hexnullid, None]) | ||||
conflictedtags = [] # for reporting purposes | ||||
mergedtags = util.sortdict(p1tags) | ||||
# sortdict does not implement iteritems() | ||||
for tname, p2nodes in p2tags.items(): | ||||
if tname not in mergedtags: | ||||
mergedtags[tname] = p2nodes | ||||
continue | ||||
p1nodes = mergedtags[tname] | ||||
mergednodes = singletagmerge(p1nodes, p2nodes) | ||||
if mergednodes is None: | ||||
conflictedtags.append(tname) | ||||
continue | ||||
mergedtags[tname] = mergednodes | ||||
if conflictedtags: | ||||
numconflicts = len(conflictedtags) | ||||
ui.warn(_('automatic .hgtags merge failed\n' | ||||
'the following %d tags are in conflict: %s\n') | ||||
% (numconflicts, ', '.join(sorted(conflictedtags)))) | ||||
return True, 1 | ||||
writemergedtags(repo, mergedtags) | ||||
ui.note(_('.hgtags merged successfully\n')) | ||||
return False, 0 | ||||