hbisect.py
339 lines
| 11.2 KiB
| text/x-python
|
PythonLexer
/ mercurial / hbisect.py
Matt Mackall
|
r5775 | # changelog bisection for mercurial | ||
# | ||||
Raphaël Gomès
|
r47575 | # Copyright 2007 Olivia Mackall | ||
Matt Mackall
|
r5775 | # Copyright 2005, 2006 Benoit Boissinot <benoit.boissinot@ens-lyon.org> | ||
Martin Geisler
|
r8228 | # | ||
Matt Mackall
|
r5775 | # Inspired by git bisect, extension skeleton taken from mq.py. | ||
# | ||||
Martin Geisler
|
r8225 | # This software may be used and distributed according to the terms of the | ||
Matt Mackall
|
r10263 | # GNU General Public License version 2 or any later version. | ||
Matt Mackall
|
r5775 | |||
Matt Harbison
|
r52755 | from __future__ import annotations | ||
Gregory Szorc
|
r25952 | |||
Martin von Zweigbergk
|
r25113 | import collections | ||
Denis Laxalde
|
r44064 | import contextlib | ||
Gregory Szorc
|
r25952 | |||
from .i18n import _ | ||||
from .node import ( | ||||
hex, | ||||
short, | ||||
) | ||||
Augie Fackler
|
r43346 | from . import error | ||
Matt Mackall
|
r5775 | |||
David Soria Parra
|
r35126 | def bisect(repo, state): | ||
Bernhard Leiner
|
r6858 | """find the next node (if any) for testing during a bisect search. | ||
returns a (nodes, number, good) tuple. | ||||
'nodes' is the final result of the bisect if 'number' is 0. | ||||
Otherwise 'number' indicates the remaining possible candidates for | ||||
the search and 'nodes' contains the next bisect target. | ||||
'good' is True if bisect is searching for a first good changeset, False | ||||
if searching for a first bad one. | ||||
""" | ||||
timeless
|
r42501 | repo = repo.unfiltered() | ||
David Soria Parra
|
r35126 | changelog = repo.changelog | ||
Matt Mackall
|
r5775 | clparents = changelog.parentrevs | ||
Augie Fackler
|
r43347 | skip = {changelog.rev(n) for n in state[b'skip']} | ||
Matt Mackall
|
r5775 | |||
Matt Mackall
|
r5776 | def buildancestors(bad, good): | ||
badrev = min([changelog.rev(n) for n in bad]) | ||||
David Soria Parra
|
r35128 | ancestors = collections.defaultdict(lambda: None) | ||
Arun Kulshreshtha
|
r50336 | for rev in repo.revs(b"(%ln::%d) - (::%ln)", good, badrev, good): | ||
Alexander Krauss
|
r14895 | ancestors[rev] = [] | ||
Matt Mackall
|
r5776 | if ancestors[badrev] is None: | ||
Matt Mackall
|
r5777 | return badrev, None | ||
Matt Mackall
|
r5776 | return badrev, ancestors | ||
Martin Geisler
|
r14215 | good = False | ||
Augie Fackler
|
r43347 | badrev, ancestors = buildancestors(state[b'bad'], state[b'good']) | ||
Augie Fackler
|
r43346 | if not ancestors: # looking for bad to good transition? | ||
Martin Geisler
|
r14215 | good = True | ||
Augie Fackler
|
r43347 | badrev, ancestors = buildancestors(state[b'good'], state[b'bad']) | ||
Matt Mackall
|
r5777 | bad = changelog.node(badrev) | ||
Augie Fackler
|
r43346 | if not ancestors: # now we're confused | ||
if ( | ||||
Augie Fackler
|
r43347 | len(state[b'bad']) == 1 | ||
and len(state[b'good']) == 1 | ||||
and state[b'bad'] != state[b'good'] | ||||
Augie Fackler
|
r43346 | ): | ||
Augie Fackler
|
r43347 | raise error.Abort(_(b"starting revisions are not directly related")) | ||
Augie Fackler
|
r43346 | raise error.Abort( | ||
Augie Fackler
|
r43347 | _(b"inconsistent state, %d:%s is good and bad") | ||
Augie Fackler
|
r43346 | % (badrev, short(bad)) | ||
) | ||||
Matt Mackall
|
r5775 | |||
# build children dict | ||||
children = {} | ||||
Martin von Zweigbergk
|
r25113 | visit = collections.deque([badrev]) | ||
Matt Mackall
|
r5775 | candidates = [] | ||
while visit: | ||||
Bryan O'Sullivan
|
r16803 | rev = visit.popleft() | ||
Matt Mackall
|
r5775 | if ancestors[rev] == []: | ||
candidates.append(rev) | ||||
for prev in clparents(rev): | ||||
if prev != -1: | ||||
if prev in children: | ||||
children[prev].append(rev) | ||||
else: | ||||
children[prev] = [rev] | ||||
visit.append(prev) | ||||
candidates.sort() | ||||
# have we narrowed it down to one entry? | ||||
Bernhard Leiner
|
r6858 | # or have all other possible candidates besides 'bad' have been skipped? | ||
Matt Mackall
|
r5775 | tot = len(candidates) | ||
Bernhard Leiner
|
r6858 | unskipped = [c for c in candidates if (c not in skip) and (c != badrev)] | ||
if tot == 1 or not unskipped: | ||||
Augie Fackler
|
r30389 | return ([changelog.node(c) for c in candidates], 0, good) | ||
Benoit Boissinot
|
r7902 | perfect = tot // 2 | ||
Matt Mackall
|
r5775 | |||
# find the best node to test | ||||
best_rev = None | ||||
best_len = -1 | ||||
Benoit Boissinot
|
r8463 | poison = set() | ||
Matt Mackall
|
r5775 | for rev in candidates: | ||
if rev in poison: | ||||
Martin Geisler
|
r8482 | # poison children | ||
poison.update(children.get(rev, [])) | ||||
Matt Mackall
|
r5775 | continue | ||
a = ancestors[rev] or [rev] | ||||
ancestors[rev] = None | ||||
Augie Fackler
|
r43346 | x = len(a) # number of ancestors | ||
y = tot - x # number of non-ancestors | ||||
value = min(x, y) # how good is this test? | ||||
Matt Mackall
|
r5775 | if value > best_len and rev not in skip: | ||
best_len = value | ||||
best_rev = rev | ||||
Augie Fackler
|
r43346 | if value == perfect: # found a perfect candidate? quit early | ||
Matt Mackall
|
r5775 | break | ||
Augie Fackler
|
r43346 | if y < perfect and rev not in skip: # all downhill from here? | ||
Martin Geisler
|
r8482 | # poison children | ||
poison.update(children.get(rev, [])) | ||||
Matt Mackall
|
r5775 | continue | ||
Arun Kulshreshtha
|
r50386 | unvisited = [] | ||
Matt Mackall
|
r5775 | for c in children.get(rev, []): | ||
if ancestors[c]: | ||||
Martin Geisler
|
r8152 | ancestors[c] = list(set(ancestors[c] + a)) | ||
Matt Mackall
|
r5775 | else: | ||
Arun Kulshreshtha
|
r50386 | unvisited.append(c) | ||
# Reuse existing ancestor list for the first unvisited child to avoid | ||||
# excessive copying for linear portions of history. | ||||
if unvisited: | ||||
first = unvisited.pop(0) | ||||
for c in unvisited: | ||||
Matt Mackall
|
r5775 | ancestors[c] = a + [c] | ||
Arun Kulshreshtha
|
r50386 | a.append(first) | ||
ancestors[first] = a | ||||
Matt Mackall
|
r5775 | |||
assert best_rev is not None | ||||
best_node = changelog.node(best_rev) | ||||
Bernhard Leiner
|
r6858 | return ([best_node], tot, good) | ||
Alexander Solovyov
|
r7227 | |||
Augie Fackler
|
r43346 | |||
Pierre-Yves David
|
r30066 | def extendrange(repo, state, nodes, good): | ||
# bisect is incomplete when it ends on a merge node and | ||||
# one of the parent was not checked. | ||||
parents = repo[nodes[0]].parents() | ||||
if len(parents) > 1: | ||||
if good: | ||||
Augie Fackler
|
r43347 | side = state[b'bad'] | ||
Pierre-Yves David
|
r30066 | else: | ||
Augie Fackler
|
r43347 | side = state[b'good'] | ||
Augie Fackler
|
r44937 | num = len({i.node() for i in parents} & set(side)) | ||
Pierre-Yves David
|
r30066 | if num == 1: | ||
return parents[0].ancestor(parents[1]) | ||||
return None | ||||
Alexander Solovyov
|
r7227 | |||
Augie Fackler
|
r43346 | |||
Alexander Solovyov
|
r7227 | def load_state(repo): | ||
Augie Fackler
|
r43347 | state = {b'current': [], b'good': [], b'bad': [], b'skip': []} | ||
for l in repo.vfs.tryreadlines(b"bisect.state"): | ||||
Bryan O'Sullivan
|
r27525 | kind, node = l[:-1].split() | ||
timeless
|
r42501 | node = repo.unfiltered().lookup(node) | ||
Bryan O'Sullivan
|
r27525 | if kind not in state: | ||
Augie Fackler
|
r43347 | raise error.Abort(_(b"unknown bisect kind %s") % kind) | ||
Bryan O'Sullivan
|
r27525 | state[kind].append(node) | ||
Alexander Solovyov
|
r7227 | return state | ||
def save_state(repo, state): | ||||
Augie Fackler
|
r43347 | f = repo.vfs(b"bisect.state", b"w", atomictemp=True) | ||
Bryan O'Sullivan
|
r27853 | with repo.wlock(): | ||
Mads Kiilerich
|
r18358 | for kind in sorted(state): | ||
Alexander Solovyov
|
r7227 | for node in state[kind]: | ||
Augie Fackler
|
r43347 | f.write(b"%s %s\n" % (kind, hex(node))) | ||
Greg Ward
|
r15057 | f.close() | ||
Alexander Solovyov
|
r7227 | |||
Augie Fackler
|
r43346 | |||
Pierre-Yves David
|
r30065 | def resetstate(repo): | ||
"""remove any bisect state from the repository""" | ||||
Augie Fackler
|
r43347 | if repo.vfs.exists(b"bisect.state"): | ||
repo.vfs.unlink(b"bisect.state") | ||||
Pierre-Yves David
|
r30065 | |||
Augie Fackler
|
r43346 | |||
Pierre-Yves David
|
r30126 | def checkstate(state): | ||
"""check we have both 'good' and 'bad' to define a range | ||||
Martin von Zweigbergk
|
r46487 | Raise StateError exception otherwise.""" | ||
Augie Fackler
|
r43347 | if state[b'good'] and state[b'bad']: | ||
Pierre-Yves David
|
r30126 | return True | ||
Augie Fackler
|
r43347 | if not state[b'good']: | ||
Martin von Zweigbergk
|
r46487 | raise error.StateError(_(b'cannot bisect (no known good revisions)')) | ||
Pierre-Yves David
|
r30126 | else: | ||
Martin von Zweigbergk
|
r46487 | raise error.StateError(_(b'cannot bisect (no known bad revisions)')) | ||
Pierre-Yves David
|
r30126 | |||
Augie Fackler
|
r43346 | |||
Denis Laxalde
|
r44064 | @contextlib.contextmanager | ||
def restore_state(repo, state, node): | ||||
try: | ||||
yield | ||||
finally: | ||||
state[b'current'] = [node] | ||||
save_state(repo, state) | ||||
"Yann E. MORIN"
|
r15135 | def get(repo, status): | ||
""" | ||||
Return a list of revision(s) that match the given status: | ||||
"Yann E. MORIN"
|
r15153 | - ``good``, ``bad``, ``skip``: csets explicitly marked as good/bad/skip | ||
Mads Kiilerich
|
r17424 | - ``goods``, ``bads`` : csets topologically good/bad | ||
"Yann E. MORIN"
|
r15153 | - ``range`` : csets taking part in the bisection | ||
- ``pruned`` : csets that are goods, bads or skipped | ||||
"Yann E. MORIN"
|
r15138 | - ``untested`` : csets whose fate is yet unknown | ||
"Yann E. MORIN"
|
r15147 | - ``ignored`` : csets ignored due to DAG topology | ||
Bryan O'Sullivan
|
r16647 | - ``current`` : the cset currently being bisected | ||
"Yann E. MORIN"
|
r15135 | """ | ||
state = load_state(repo) | ||||
Augie Fackler
|
r43347 | if status in (b'good', b'bad', b'skip', b'current'): | ||
timeless
|
r42501 | return map(repo.unfiltered().changelog.rev, state[status]) | ||
"Yann E. MORIN"
|
r15135 | else: | ||
timeless@mozdev.org
|
r17493 | # In the following sets, we do *not* call 'bisect()' with more | ||
timeless@mozdev.org
|
r17509 | # than one level of recursion, because that can be very, very | ||
"Yann E. MORIN"
|
r15146 | # time consuming. Instead, we always develop the expression as | ||
# much as possible. | ||||
# 'range' is all csets that make the bisection: | ||||
# - have a good ancestor and a bad descendant, or conversely | ||||
# that's because the bisection can go either way | ||||
Augie Fackler
|
r43347 | range = b'( bisect(bad)::bisect(good) | bisect(good)::bisect(bad) )' | ||
"Yann E. MORIN"
|
r15136 | |||
Augie Fackler
|
r43347 | _t = repo.revs(b'bisect(good)::bisect(bad)') | ||
"Yann E. MORIN"
|
r15153 | # The sets of topologically good or bad csets | ||
if len(_t) == 0: | ||||
# Goods are topologically after bads | ||||
Augie Fackler
|
r43347 | goods = b'bisect(good)::' # Pruned good csets | ||
bads = b'::bisect(bad)' # Pruned bad csets | ||||
"Yann E. MORIN"
|
r15153 | else: | ||
# Goods are topologically before bads | ||||
Augie Fackler
|
r43347 | goods = b'::bisect(good)' # Pruned good csets | ||
bads = b'bisect(bad)::' # Pruned bad csets | ||||
"Yann E. MORIN"
|
r15153 | |||
# 'pruned' is all csets whose fate is already known: good, bad, skip | ||||
Augie Fackler
|
r43347 | skips = b'bisect(skip)' # Pruned skipped csets | ||
pruned = b'( (%s) | (%s) | (%s) )' % (goods, bads, skips) | ||||
"Yann E. MORIN"
|
r15136 | |||
"Yann E. MORIN"
|
r15146 | # 'untested' is all cset that are- in 'range', but not in 'pruned' | ||
Augie Fackler
|
r43347 | untested = b'( (%s) - (%s) )' % (range, pruned) | ||
"Yann E. MORIN"
|
r15136 | |||
"Yann E. MORIN"
|
r15147 | # 'ignored' is all csets that were not used during the bisection | ||
# due to DAG topology, but may however have had an impact. | ||||
Mads Kiilerich
|
r17424 | # E.g., a branch merged between bads and goods, but whose branch- | ||
"Yann E. MORIN"
|
r15147 | # point is out-side of the range. | ||
Augie Fackler
|
r43347 | iba = b'::bisect(bad) - ::bisect(good)' # Ignored bads' ancestors | ||
iga = b'::bisect(good) - ::bisect(bad)' # Ignored goods' ancestors | ||||
ignored = b'( ( (%s) | (%s) ) - (%s) )' % (iba, iga, range) | ||||
"Yann E. MORIN"
|
r15147 | |||
Augie Fackler
|
r43347 | if status == b'range': | ||
Matt Mackall
|
r15404 | return repo.revs(range) | ||
Augie Fackler
|
r43347 | elif status == b'pruned': | ||
Matt Mackall
|
r15404 | return repo.revs(pruned) | ||
Augie Fackler
|
r43347 | elif status == b'untested': | ||
Matt Mackall
|
r15404 | return repo.revs(untested) | ||
Augie Fackler
|
r43347 | elif status == b'ignored': | ||
Matt Mackall
|
r15404 | return repo.revs(ignored) | ||
Augie Fackler
|
r43347 | elif status == b"goods": | ||
Matt Mackall
|
r15404 | return repo.revs(goods) | ||
Augie Fackler
|
r43347 | elif status == b"bads": | ||
Matt Mackall
|
r15404 | return repo.revs(bads) | ||
"Yann E. MORIN"
|
r15136 | else: | ||
Augie Fackler
|
r43347 | raise error.ParseError(_(b'invalid bisect state')) | ||
"Yann E. MORIN"
|
r15154 | |||
Augie Fackler
|
r43346 | |||
"Yann E. MORIN"
|
r15406 | def label(repo, node): | ||
"Yann E. MORIN"
|
r15154 | rev = repo.changelog.rev(node) | ||
# Try explicit sets | ||||
Augie Fackler
|
r43347 | if rev in get(repo, b'good'): | ||
Wagner Bruna
|
r15308 | # i18n: bisect changeset status | ||
Augie Fackler
|
r43347 | return _(b'good') | ||
if rev in get(repo, b'bad'): | ||||
Wagner Bruna
|
r15308 | # i18n: bisect changeset status | ||
Augie Fackler
|
r43347 | return _(b'bad') | ||
if rev in get(repo, b'skip'): | ||||
Wagner Bruna
|
r15308 | # i18n: bisect changeset status | ||
Augie Fackler
|
r43347 | return _(b'skipped') | ||
if rev in get(repo, b'untested') or rev in get(repo, b'current'): | ||||
Wagner Bruna
|
r15308 | # i18n: bisect changeset status | ||
Augie Fackler
|
r43347 | return _(b'untested') | ||
if rev in get(repo, b'ignored'): | ||||
Wagner Bruna
|
r15308 | # i18n: bisect changeset status | ||
Augie Fackler
|
r43347 | return _(b'ignored') | ||
"Yann E. MORIN"
|
r15154 | |||
# Try implicit sets | ||||
Augie Fackler
|
r43347 | if rev in get(repo, b'goods'): | ||
Wagner Bruna
|
r15308 | # i18n: bisect changeset status | ||
Augie Fackler
|
r43347 | return _(b'good (implicit)') | ||
if rev in get(repo, b'bads'): | ||||
Wagner Bruna
|
r15308 | # i18n: bisect changeset status | ||
Augie Fackler
|
r43347 | return _(b'bad (implicit)') | ||
"Yann E. MORIN"
|
r15154 | |||
return None | ||||
Augie Fackler
|
r43346 | |||
Pierre-Yves David
|
r30067 | def printresult(ui, repo, state, displayer, nodes, good): | ||
timeless
|
r42501 | repo = repo.unfiltered() | ||
Pierre-Yves David
|
r30067 | if len(nodes) == 1: | ||
# narrowed it down to a single revision | ||||
if good: | ||||
Augie Fackler
|
r43347 | ui.write(_(b"The first good revision is:\n")) | ||
Pierre-Yves David
|
r30067 | else: | ||
Augie Fackler
|
r43347 | ui.write(_(b"The first bad revision is:\n")) | ||
Pierre-Yves David
|
r30067 | displayer.show(repo[nodes[0]]) | ||
extendnode = extendrange(repo, state, nodes, good) | ||||
if extendnode is not None: | ||||
Augie Fackler
|
r43346 | ui.write( | ||
_( | ||||
Augie Fackler
|
r43347 | b'Not all ancestors of this changeset have been' | ||
b' checked.\nUse bisect --extend to continue the ' | ||||
b'bisection from\nthe common ancestor, %s.\n' | ||||
Augie Fackler
|
r43346 | ) | ||
% extendnode | ||||
) | ||||
Pierre-Yves David
|
r30067 | else: | ||
# multiple possible revisions | ||||
if good: | ||||
Augie Fackler
|
r43346 | ui.write( | ||
_( | ||||
Augie Fackler
|
r43347 | b"Due to skipped revisions, the first " | ||
b"good revision could be any of:\n" | ||||
Augie Fackler
|
r43346 | ) | ||
) | ||||
Pierre-Yves David
|
r30067 | else: | ||
Augie Fackler
|
r43346 | ui.write( | ||
_( | ||||
Augie Fackler
|
r43347 | b"Due to skipped revisions, the first " | ||
b"bad revision could be any of:\n" | ||||
Augie Fackler
|
r43346 | ) | ||
) | ||||
Pierre-Yves David
|
r30067 | for n in nodes: | ||
displayer.show(repo[n]) | ||||
displayer.close() | ||||