ancestor.py
393 lines
| 12.4 KiB
| text/x-python
|
PythonLexer
/ mercurial / ancestor.py
Matt Mackall
|
r3135 | # ancestor.py - generic DAG ancestor algorithm for mercurial | ||
# | ||||
Raphaël Gomès
|
r47575 | # Copyright 2006 Olivia Mackall <olivia@selenic.com> | ||
Matt Mackall
|
r3135 | # | ||
Martin Geisler
|
r8225 | # This software may be used and distributed according to the terms of the | ||
Matt Mackall
|
r10263 | # GNU General Public License version 2 or any later version. | ||
Matt Mackall
|
r3135 | |||
Gregory Szorc
|
r25915 | |||
Augie Fackler
|
r20034 | import heapq | ||
Gregory Szorc
|
r25915 | |||
from .node import nullrev | ||||
Gregory Szorc
|
r38806 | from . import ( | ||
Georges Racinet
|
r41280 | dagop, | ||
Georges Racinet
|
r40334 | policy, | ||
Gregory Szorc
|
r38806 | ) | ||
Matt Mackall
|
r3135 | |||
Augie Fackler
|
r43906 | parsers = policy.importmod('parsers') | ||
Georges Racinet
|
r40334 | |||
Augie Fackler
|
r43346 | |||
Mads Kiilerich
|
r21101 | def commonancestorsheads(pfunc, *nodes): | ||
"""Returns a set with the heads of all common ancestors of all nodes, | ||||
heads(::nodes[0] and ::nodes[1] and ...) . | ||||
pfunc must return a list of parent vertices for a given vertex. | ||||
""" | ||||
if not isinstance(nodes, set): | ||||
nodes = set(nodes) | ||||
if nullrev in nodes: | ||||
return set() | ||||
if len(nodes) <= 1: | ||||
return nodes | ||||
allseen = (1 << len(nodes)) - 1 | ||||
seen = [0] * (max(nodes) + 1) | ||||
for i, n in enumerate(nodes): | ||||
seen[n] = 1 << i | ||||
poison = 1 << (i + 1) | ||||
gca = set() | ||||
interesting = len(nodes) | ||||
nv = len(seen) - 1 | ||||
while nv >= 0 and interesting: | ||||
v = nv | ||||
nv -= 1 | ||||
if not seen[v]: | ||||
continue | ||||
sv = seen[v] | ||||
if sv < poison: | ||||
interesting -= 1 | ||||
if sv == allseen: | ||||
gca.add(v) | ||||
sv |= poison | ||||
if v in nodes: | ||||
# history is linear | ||||
Martin von Zweigbergk
|
r32291 | return {v} | ||
Mads Kiilerich
|
r21101 | if sv < poison: | ||
for p in pfunc(v): | ||||
sp = seen[p] | ||||
if p == nullrev: | ||||
continue | ||||
if sp == 0: | ||||
seen[p] = sv | ||||
interesting += 1 | ||||
elif sp != sv: | ||||
seen[p] |= sv | ||||
else: | ||||
for p in pfunc(v): | ||||
if p == nullrev: | ||||
continue | ||||
sp = seen[p] | ||||
if sp and sp < poison: | ||||
interesting -= 1 | ||||
seen[p] = sv | ||||
return gca | ||||
Augie Fackler
|
r43346 | |||
Bryan O'Sullivan
|
r18986 | def ancestors(pfunc, *orignodes): | ||
""" | ||||
Returns the common ancestors of a and b that are furthest from a | ||||
root (as measured by longest path). | ||||
pfunc must return a list of parent vertices for a given vertex. | ||||
""" | ||||
Augie Fackler
|
r43346 | |||
Bryan O'Sullivan
|
r18986 | def deepest(nodes): | ||
interesting = {} | ||||
count = max(nodes) + 1 | ||||
depth = [0] * count | ||||
seen = [0] * count | ||||
mapping = [] | ||||
Raphaël Gomès
|
r52596 | for i, n in enumerate(sorted(nodes)): | ||
Bryan O'Sullivan
|
r18986 | depth[n] = 1 | ||
b = 1 << i | ||||
seen[n] = b | ||||
interesting[b] = 1 | ||||
mapping.append((b, n)) | ||||
nv = count - 1 | ||||
while nv >= 0 and len(interesting) > 1: | ||||
v = nv | ||||
nv -= 1 | ||||
dv = depth[v] | ||||
if dv == 0: | ||||
continue | ||||
sv = seen[v] | ||||
for p in pfunc(v): | ||||
if p == nullrev: | ||||
continue | ||||
dp = depth[p] | ||||
Matt Harbison
|
r44421 | sp = seen[p] | ||
Bryan O'Sullivan
|
r18986 | if dp <= dv: | ||
depth[p] = dv + 1 | ||||
if sp != sv: | ||||
interesting[sv] += 1 | ||||
Matt Harbison
|
r44421 | seen[p] = sv | ||
Bryan O'Sullivan
|
r18986 | if sp: | ||
interesting[sp] -= 1 | ||||
if interesting[sp] == 0: | ||||
del interesting[sp] | ||||
elif dv == dp - 1: | ||||
nsp = sp | sv | ||||
if nsp == sp: | ||||
continue | ||||
seen[p] = nsp | ||||
interesting.setdefault(nsp, 0) | ||||
interesting[nsp] += 1 | ||||
interesting[sp] -= 1 | ||||
if interesting[sp] == 0: | ||||
del interesting[sp] | ||||
interesting[sv] -= 1 | ||||
if interesting[sv] == 0: | ||||
del interesting[sv] | ||||
if len(interesting) != 1: | ||||
return [] | ||||
k = 0 | ||||
for i in interesting: | ||||
k |= i | ||||
Augie Fackler
|
r44937 | return {n for (i, n) in mapping if k & i} | ||
Bryan O'Sullivan
|
r18986 | |||
Mads Kiilerich
|
r21101 | gca = commonancestorsheads(pfunc, *orignodes) | ||
Bryan O'Sullivan
|
r18986 | |||
if len(gca) <= 1: | ||||
return gca | ||||
return deepest(gca) | ||||
Augie Fackler
|
r43346 | |||
Gregory Szorc
|
r49801 | class incrementalmissingancestors: | ||
Augie Fackler
|
r46554 | """persistent state used to calculate missing ancestors incrementally | ||
Siddharth Agarwal
|
r17970 | |||
Siddharth Agarwal
|
r23334 | Although similar in spirit to lazyancestors below, this is a separate class | ||
because trying to support contains and missingancestors operations with the | ||||
Augie Fackler
|
r46554 | same internal data structures adds needless complexity.""" | ||
Augie Fackler
|
r43346 | |||
Siddharth Agarwal
|
r23334 | def __init__(self, pfunc, bases): | ||
self.bases = set(bases) | ||||
if not self.bases: | ||||
self.bases.add(nullrev) | ||||
self.pfunc = pfunc | ||||
Siddharth Agarwal
|
r17970 | |||
Siddharth Agarwal
|
r23340 | def hasbases(self): | ||
'''whether the common set has any non-trivial bases''' | ||||
Martin von Zweigbergk
|
r32291 | return self.bases and self.bases != {nullrev} | ||
Siddharth Agarwal
|
r23340 | |||
Siddharth Agarwal
|
r23341 | def addbases(self, newbases): | ||
'''grow the ancestor set by adding new bases''' | ||||
self.bases.update(newbases) | ||||
Georges Racinet
|
r41280 | def basesheads(self): | ||
return dagop.headrevs(self.bases, self.pfunc) | ||||
Siddharth Agarwal
|
r23342 | def removeancestorsfrom(self, revs): | ||
'''remove all ancestors of bases from the set revs (in place)''' | ||||
bases = self.bases | ||||
pfunc = self.pfunc | ||||
revs.difference_update(bases) | ||||
# nullrev is always an ancestor | ||||
revs.discard(nullrev) | ||||
if not revs: | ||||
return | ||||
# anything in revs > start is definitely not an ancestor of bases | ||||
# revs <= start needs to be investigated | ||||
start = max(bases) | ||||
keepcount = sum(1 for r in revs if r > start) | ||||
if len(revs) == keepcount: | ||||
# no revs to consider | ||||
return | ||||
Manuel Jacob
|
r50179 | for curr in range(start, min(revs) - 1, -1): | ||
Siddharth Agarwal
|
r23342 | if curr not in bases: | ||
continue | ||||
revs.discard(curr) | ||||
bases.update(pfunc(curr)) | ||||
if len(revs) == keepcount: | ||||
# no more potential revs to discard | ||||
break | ||||
Siddharth Agarwal
|
r23334 | def missingancestors(self, revs): | ||
Augie Fackler
|
r46554 | """return all the ancestors of revs that are not ancestors of self.bases | ||
Siddharth Agarwal
|
r23334 | |||
This may include elements from revs. | ||||
Siddharth Agarwal
|
r17970 | |||
Siddharth Agarwal
|
r23334 | Equivalent to the revset (::revs - ::self.bases). Revs are returned in | ||
Augie Fackler
|
r46554 | revision number order, which is a topological order.""" | ||
Siddharth Agarwal
|
r23334 | revsvisit = set(revs) | ||
basesvisit = self.bases | ||||
pfunc = self.pfunc | ||||
bothvisit = revsvisit.intersection(basesvisit) | ||||
revsvisit.difference_update(bothvisit) | ||||
Siddharth Agarwal
|
r17970 | if not revsvisit: | ||
Siddharth Agarwal
|
r23334 | return [] | ||
Siddharth Agarwal
|
r17970 | |||
Siddharth Agarwal
|
r23334 | start = max(max(revsvisit), max(basesvisit)) | ||
# At this point, we hold the invariants that: | ||||
# - revsvisit is the set of nodes we know are an ancestor of at least | ||||
# one of the nodes in revs | ||||
# - basesvisit is the same for bases | ||||
# - bothvisit is the set of nodes we know are ancestors of at least one | ||||
# of the nodes in revs and one of the nodes in bases. bothvisit and | ||||
# revsvisit are mutually exclusive, but bothvisit is a subset of | ||||
# basesvisit. | ||||
# Now we walk down in reverse topo order, adding parents of nodes | ||||
# already visited to the sets while maintaining the invariants. When a | ||||
# node is found in both revsvisit and basesvisit, it is removed from | ||||
# revsvisit and added to bothvisit. When revsvisit becomes empty, there | ||||
# are no more ancestors of revs that aren't also ancestors of bases, so | ||||
# exit. | ||||
missing = [] | ||||
Manuel Jacob
|
r50179 | for curr in range(start, nullrev, -1): | ||
Siddharth Agarwal
|
r23334 | if not revsvisit: | ||
break | ||||
Siddharth Agarwal
|
r17970 | |||
Siddharth Agarwal
|
r23334 | if curr in bothvisit: | ||
bothvisit.remove(curr) | ||||
# curr's parents might have made it into revsvisit through | ||||
# another path | ||||
for p in pfunc(curr): | ||||
revsvisit.discard(p) | ||||
basesvisit.add(p) | ||||
bothvisit.add(p) | ||||
continue | ||||
Siddharth Agarwal
|
r17970 | |||
Siddharth Agarwal
|
r23334 | if curr in revsvisit: | ||
missing.append(curr) | ||||
revsvisit.remove(curr) | ||||
thisvisit = revsvisit | ||||
othervisit = basesvisit | ||||
elif curr in basesvisit: | ||||
thisvisit = basesvisit | ||||
othervisit = revsvisit | ||||
Siddharth Agarwal
|
r17970 | else: | ||
Siddharth Agarwal
|
r23334 | # not an ancestor of revs or bases: ignore | ||
continue | ||||
Siddharth Agarwal
|
r17970 | |||
Siddharth Agarwal
|
r23334 | for p in pfunc(curr): | ||
if p == nullrev: | ||||
pass | ||||
elif p in othervisit or p in bothvisit: | ||||
# p is implicitly in thisvisit. This means p is or should be | ||||
# in bothvisit | ||||
revsvisit.discard(p) | ||||
basesvisit.add(p) | ||||
bothvisit.add(p) | ||||
else: | ||||
# visit later | ||||
thisvisit.add(p) | ||||
missing.reverse() | ||||
return missing | ||||
Augie Fackler
|
r43346 | |||
Martin von Zweigbergk
|
r39517 | # Extracted from lazyancestors.__iter__ to avoid a reference cycle | ||
def _lazyancestorsiter(parentrevs, initrevs, stoprev, inclusive): | ||||
seen = {nullrev} | ||||
Yuya Nishihara
|
r39573 | heappush = heapq.heappush | ||
heappop = heapq.heappop | ||||
Yuya Nishihara
|
r39574 | heapreplace = heapq.heapreplace | ||
Martin von Zweigbergk
|
r39517 | see = seen.add | ||
if inclusive: | ||||
Yuya Nishihara
|
r39569 | visit = [-r for r in initrevs] | ||
seen.update(initrevs) | ||||
Martin von Zweigbergk
|
r39517 | heapq.heapify(visit) | ||
else: | ||||
visit = [] | ||||
heapq.heapify(visit) | ||||
Yuya Nishihara
|
r39569 | for r in initrevs: | ||
Yuya Nishihara
|
r39571 | p1, p2 = parentrevs(r) | ||
if p1 not in seen: | ||||
Yuya Nishihara
|
r39573 | heappush(visit, -p1) | ||
Yuya Nishihara
|
r39571 | see(p1) | ||
if p2 not in seen: | ||||
Yuya Nishihara
|
r39573 | heappush(visit, -p2) | ||
Yuya Nishihara
|
r39571 | see(p2) | ||
Martin von Zweigbergk
|
r39517 | |||
while visit: | ||||
Yuya Nishihara
|
r39572 | current = -visit[0] | ||
Yuya Nishihara
|
r39570 | if current < stoprev: | ||
break | ||||
yield current | ||||
Yuya Nishihara
|
r39572 | # optimize out heapq operation if p1 is known to be the next highest | ||
# revision, which is quite common in linear history. | ||||
Yuya Nishihara
|
r39571 | p1, p2 = parentrevs(current) | ||
if p1 not in seen: | ||||
Yuya Nishihara
|
r39572 | if current - p1 == 1: | ||
visit[0] = -p1 | ||||
else: | ||||
Yuya Nishihara
|
r39574 | heapreplace(visit, -p1) | ||
Yuya Nishihara
|
r39571 | see(p1) | ||
Yuya Nishihara
|
r39572 | else: | ||
Yuya Nishihara
|
r39573 | heappop(visit) | ||
Yuya Nishihara
|
r39571 | if p2 not in seen: | ||
Yuya Nishihara
|
r39573 | heappush(visit, -p2) | ||
Yuya Nishihara
|
r39571 | see(p2) | ||
Martin von Zweigbergk
|
r39517 | |||
Augie Fackler
|
r43346 | |||
Gregory Szorc
|
r49801 | class lazyancestors: | ||
Siddharth Agarwal
|
r23328 | def __init__(self, pfunc, revs, stoprev=0, inclusive=False): | ||
Siddharth Agarwal
|
r18090 | """Create a new object generating ancestors for the given revs. Does | ||
not generate revs lower than stoprev. | ||||
Siddharth Agarwal
|
r18091 | This is computed lazily starting from revs. The object supports | ||
iteration and membership. | ||||
Siddharth Agarwal
|
r18090 | |||
cl should be a changelog and revs should be an iterable. inclusive is | ||||
a boolean that indicates whether revs should be included. Revs lower | ||||
than stoprev will not be generated. | ||||
Result does not include the null revision.""" | ||||
Siddharth Agarwal
|
r23328 | self._parentrevs = pfunc | ||
Matt Harbison
|
r44420 | self._initrevs = [r for r in revs if r >= stoprev] | ||
Siddharth Agarwal
|
r18090 | self._stoprev = stoprev | ||
self._inclusive = inclusive | ||||
Martin von Zweigbergk
|
r39518 | self._containsseen = set() | ||
Augie Fackler
|
r43346 | self._containsiter = _lazyancestorsiter( | ||
self._parentrevs, self._initrevs, self._stoprev, self._inclusive | ||||
) | ||||
Siddharth Agarwal
|
r18091 | |||
Pierre-Yves David
|
r22225 | def __nonzero__(self): | ||
"""False if the set is empty, True otherwise.""" | ||||
try: | ||||
timeless
|
r29216 | next(iter(self)) | ||
Pierre-Yves David
|
r22225 | return True | ||
except StopIteration: | ||||
return False | ||||
Gregory Szorc
|
r31476 | __bool__ = __nonzero__ | ||
Siddharth Agarwal
|
r18090 | def __iter__(self): | ||
"""Generate the ancestors of _initrevs in reverse topological order. | ||||
If inclusive is False, yield a sequence of revision numbers starting | ||||
Boris Feld
|
r39509 | with the parents of each revision in revs, i.e., each revision is | ||
*not* considered an ancestor of itself. Results are emitted in reverse | ||||
revision number order. That order is also topological: a child is | ||||
always emitted before its parent. | ||||
Siddharth Agarwal
|
r18090 | |||
Boris Feld
|
r39510 | If inclusive is True, the source revisions are also yielded. The | ||
reverse revision number order is still enforced.""" | ||||
Augie Fackler
|
r43346 | return _lazyancestorsiter( | ||
self._parentrevs, self._initrevs, self._stoprev, self._inclusive | ||||
) | ||||
Siddharth Agarwal
|
r18091 | |||
def __contains__(self, target): | ||||
"""Test whether target is an ancestor of self._initrevs.""" | ||||
seen = self._containsseen | ||||
if target in seen: | ||||
return True | ||||
Martin von Zweigbergk
|
r39518 | iter = self._containsiter | ||
if iter is None: | ||||
# Iterator exhausted | ||||
return False | ||||
Yuya Nishihara
|
r38614 | # Only integer target is valid, but some callers expect 'None in self' | ||
# to be False. So we explicitly allow it. | ||||
if target is None: | ||||
return False | ||||
Siddharth Agarwal
|
r18091 | |||
Pierre-Yves David
|
r25639 | see = seen.add | ||
Martin von Zweigbergk
|
r39518 | try: | ||
while True: | ||||
rev = next(iter) | ||||
see(rev) | ||||
if rev == target: | ||||
return True | ||||
if rev < target: | ||||
return False | ||||
except StopIteration: | ||||
# Set to None to indicate fast-path can be used next time, and to | ||||
# free up memory. | ||||
self._containsiter = None | ||||
return False | ||||