hbisect.py
258 lines
| 9.0 KiB
| text/x-python
|
PythonLexer
/ mercurial / hbisect.py
Matt Mackall
|
r5775 | # changelog bisection for mercurial | ||
# | ||||
# Copyright 2007 Matt Mackall | ||||
# Copyright 2005, 2006 Benoit Boissinot <benoit.boissinot@ens-lyon.org> | ||||
Martin Geisler
|
r8228 | # | ||
Matt Mackall
|
r5775 | # Inspired by git bisect, extension skeleton taken from mq.py. | ||
# | ||||
Martin Geisler
|
r8225 | # This software may be used and distributed according to the terms of the | ||
Matt Mackall
|
r10263 | # GNU General Public License version 2 or any later version. | ||
Matt Mackall
|
r5775 | |||
"Yann E. MORIN"
|
r15135 | import os, error | ||
Matt Mackall
|
r5775 | from i18n import _ | ||
Alexander Solovyov
|
r7227 | from node import short, hex | ||
Bryan O'Sullivan
|
r16834 | import util | ||
Matt Mackall
|
r5775 | |||
def bisect(changelog, state): | ||||
Bernhard Leiner
|
r6858 | """find the next node (if any) for testing during a bisect search. | ||
returns a (nodes, number, good) tuple. | ||||
'nodes' is the final result of the bisect if 'number' is 0. | ||||
Otherwise 'number' indicates the remaining possible candidates for | ||||
the search and 'nodes' contains the next bisect target. | ||||
'good' is True if bisect is searching for a first good changeset, False | ||||
if searching for a first bad one. | ||||
""" | ||||
Matt Mackall
|
r5775 | clparents = changelog.parentrevs | ||
Martin Geisler
|
r8152 | skip = set([changelog.rev(n) for n in state['skip']]) | ||
Matt Mackall
|
r5775 | |||
Matt Mackall
|
r5776 | def buildancestors(bad, good): | ||
# only the earliest bad revision matters | ||||
badrev = min([changelog.rev(n) for n in bad]) | ||||
goodrevs = [changelog.rev(n) for n in good] | ||||
Matt Mackall
|
r9583 | goodrev = min(goodrevs) | ||
# build visit array | ||||
ancestors = [None] * (len(changelog) + 1) # an extra for [-1] | ||||
Alexander Krauss
|
r14895 | # set nodes descended from goodrevs | ||
for rev in goodrevs: | ||||
ancestors[rev] = [] | ||||
Matt Mackall
|
r9583 | for rev in xrange(goodrev + 1, len(changelog)): | ||
for prev in clparents(rev): | ||||
if ancestors[prev] == []: | ||||
ancestors[rev] = [] | ||||
Matt Mackall
|
r5775 | |||
Matt Mackall
|
r5776 | # clear good revs from array | ||
Alexander Krauss
|
r14894 | for rev in goodrevs: | ||
ancestors[rev] = None | ||||
Alexander Krauss
|
r14893 | for rev in xrange(len(changelog), goodrev, -1): | ||
Matt Mackall
|
r5776 | if ancestors[rev] is None: | ||
for prev in clparents(rev): | ||||
ancestors[prev] = None | ||||
Matt Mackall
|
r5775 | |||
Matt Mackall
|
r5776 | if ancestors[badrev] is None: | ||
Matt Mackall
|
r5777 | return badrev, None | ||
Matt Mackall
|
r5776 | return badrev, ancestors | ||
Martin Geisler
|
r14215 | good = False | ||
Matt Mackall
|
r5776 | badrev, ancestors = buildancestors(state['bad'], state['good']) | ||
if not ancestors: # looking for bad to good transition? | ||||
Martin Geisler
|
r14215 | good = True | ||
Matt Mackall
|
r5776 | badrev, ancestors = buildancestors(state['good'], state['bad']) | ||
Matt Mackall
|
r5777 | bad = changelog.node(badrev) | ||
Matt Mackall
|
r5776 | if not ancestors: # now we're confused | ||
Matt Mackall
|
r12005 | if len(state['bad']) == 1 and len(state['good']) == 1: | ||
raise util.Abort(_("starting revisions are not directly related")) | ||||
Martin Geisler
|
r12067 | raise util.Abort(_("inconsistent state, %s:%s is good and bad") | ||
Joel Rosdahl
|
r6217 | % (badrev, short(bad))) | ||
Matt Mackall
|
r5775 | |||
# build children dict | ||||
children = {} | ||||
Bryan O'Sullivan
|
r16834 | visit = util.deque([badrev]) | ||
Matt Mackall
|
r5775 | candidates = [] | ||
while visit: | ||||
Bryan O'Sullivan
|
r16803 | rev = visit.popleft() | ||
Matt Mackall
|
r5775 | if ancestors[rev] == []: | ||
candidates.append(rev) | ||||
for prev in clparents(rev): | ||||
if prev != -1: | ||||
if prev in children: | ||||
children[prev].append(rev) | ||||
else: | ||||
children[prev] = [rev] | ||||
visit.append(prev) | ||||
candidates.sort() | ||||
# have we narrowed it down to one entry? | ||||
Bernhard Leiner
|
r6858 | # or have all other possible candidates besides 'bad' have been skipped? | ||
Matt Mackall
|
r5775 | tot = len(candidates) | ||
Bernhard Leiner
|
r6858 | unskipped = [c for c in candidates if (c not in skip) and (c != badrev)] | ||
if tot == 1 or not unskipped: | ||||
return ([changelog.node(rev) for rev in candidates], 0, good) | ||||
Benoit Boissinot
|
r7902 | perfect = tot // 2 | ||
Matt Mackall
|
r5775 | |||
# find the best node to test | ||||
best_rev = None | ||||
best_len = -1 | ||||
Benoit Boissinot
|
r8463 | poison = set() | ||
Matt Mackall
|
r5775 | for rev in candidates: | ||
if rev in poison: | ||||
Martin Geisler
|
r8482 | # poison children | ||
poison.update(children.get(rev, [])) | ||||
Matt Mackall
|
r5775 | continue | ||
a = ancestors[rev] or [rev] | ||||
ancestors[rev] = None | ||||
x = len(a) # number of ancestors | ||||
y = tot - x # number of non-ancestors | ||||
value = min(x, y) # how good is this test? | ||||
if value > best_len and rev not in skip: | ||||
best_len = value | ||||
best_rev = rev | ||||
if value == perfect: # found a perfect candidate? quit early | ||||
break | ||||
Bernhard Leiner
|
r7557 | if y < perfect and rev not in skip: # all downhill from here? | ||
Martin Geisler
|
r8482 | # poison children | ||
poison.update(children.get(rev, [])) | ||||
Matt Mackall
|
r5775 | continue | ||
for c in children.get(rev, []): | ||||
if ancestors[c]: | ||||
Martin Geisler
|
r8152 | ancestors[c] = list(set(ancestors[c] + a)) | ||
Matt Mackall
|
r5775 | else: | ||
ancestors[c] = a + [c] | ||||
assert best_rev is not None | ||||
best_node = changelog.node(best_rev) | ||||
Bernhard Leiner
|
r6858 | return ([best_node], tot, good) | ||
Alexander Solovyov
|
r7227 | |||
def load_state(repo): | ||||
Bryan O'Sullivan
|
r16647 | state = {'current': [], 'good': [], 'bad': [], 'skip': []} | ||
Alexander Solovyov
|
r7227 | if os.path.exists(repo.join("bisect.state")): | ||
for l in repo.opener("bisect.state"): | ||||
kind, node = l[:-1].split() | ||||
node = repo.lookup(node) | ||||
if kind not in state: | ||||
raise util.Abort(_("unknown bisect kind %s") % kind) | ||||
state[kind].append(node) | ||||
return state | ||||
def save_state(repo, state): | ||||
f = repo.opener("bisect.state", "w", atomictemp=True) | ||||
wlock = repo.wlock() | ||||
try: | ||||
for kind in state: | ||||
for node in state[kind]: | ||||
f.write("%s %s\n" % (kind, hex(node))) | ||||
Greg Ward
|
r15057 | f.close() | ||
Alexander Solovyov
|
r7227 | finally: | ||
Ronny Pfannschmidt
|
r8109 | wlock.release() | ||
Alexander Solovyov
|
r7227 | |||
"Yann E. MORIN"
|
r15135 | def get(repo, status): | ||
""" | ||||
Return a list of revision(s) that match the given status: | ||||
"Yann E. MORIN"
|
r15153 | - ``good``, ``bad``, ``skip``: csets explicitly marked as good/bad/skip | ||
- ``goods``, ``bads`` : csets topologicaly good/bad | ||||
- ``range`` : csets taking part in the bisection | ||||
- ``pruned`` : csets that are goods, bads or skipped | ||||
"Yann E. MORIN"
|
r15138 | - ``untested`` : csets whose fate is yet unknown | ||
"Yann E. MORIN"
|
r15147 | - ``ignored`` : csets ignored due to DAG topology | ||
Bryan O'Sullivan
|
r16647 | - ``current`` : the cset currently being bisected | ||
"Yann E. MORIN"
|
r15135 | """ | ||
state = load_state(repo) | ||||
Bryan O'Sullivan
|
r16647 | if status in ('good', 'bad', 'skip', 'current'): | ||
return map(repo.changelog.rev, state[status]) | ||||
"Yann E. MORIN"
|
r15135 | else: | ||
"Yann E. MORIN"
|
r15146 | # In the floowing sets, we do *not* call 'bisect()' with more | ||
# than one level of recusrsion, because that can be very, very | ||||
# time consuming. Instead, we always develop the expression as | ||||
# much as possible. | ||||
# 'range' is all csets that make the bisection: | ||||
# - have a good ancestor and a bad descendant, or conversely | ||||
# that's because the bisection can go either way | ||||
range = '( bisect(bad)::bisect(good) | bisect(good)::bisect(bad) )' | ||||
"Yann E. MORIN"
|
r15136 | |||
Matt Mackall
|
r15404 | _t = repo.revs('bisect(good)::bisect(bad)') | ||
"Yann E. MORIN"
|
r15153 | # The sets of topologically good or bad csets | ||
if len(_t) == 0: | ||||
# Goods are topologically after bads | ||||
goods = 'bisect(good)::' # Pruned good csets | ||||
bads = '::bisect(bad)' # Pruned bad csets | ||||
else: | ||||
# Goods are topologically before bads | ||||
goods = '::bisect(good)' # Pruned good csets | ||||
bads = 'bisect(bad)::' # Pruned bad csets | ||||
# 'pruned' is all csets whose fate is already known: good, bad, skip | ||||
skips = 'bisect(skip)' # Pruned skipped csets | ||||
pruned = '( (%s) | (%s) | (%s) )' % (goods, bads, skips) | ||||
"Yann E. MORIN"
|
r15136 | |||
"Yann E. MORIN"
|
r15146 | # 'untested' is all cset that are- in 'range', but not in 'pruned' | ||
untested = '( (%s) - (%s) )' % (range, pruned) | ||||
"Yann E. MORIN"
|
r15136 | |||
"Yann E. MORIN"
|
r15147 | # 'ignored' is all csets that were not used during the bisection | ||
# due to DAG topology, but may however have had an impact. | ||||
# Eg., a branch merged between bads and goods, but whose branch- | ||||
# point is out-side of the range. | ||||
iba = '::bisect(bad) - ::bisect(good)' # Ignored bads' ancestors | ||||
iga = '::bisect(good) - ::bisect(bad)' # Ignored goods' ancestors | ||||
ignored = '( ( (%s) | (%s) ) - (%s) )' % (iba, iga, range) | ||||
"Yann E. MORIN"
|
r15136 | if status == 'range': | ||
Matt Mackall
|
r15404 | return repo.revs(range) | ||
"Yann E. MORIN"
|
r15137 | elif status == 'pruned': | ||
Matt Mackall
|
r15404 | return repo.revs(pruned) | ||
"Yann E. MORIN"
|
r15138 | elif status == 'untested': | ||
Matt Mackall
|
r15404 | return repo.revs(untested) | ||
"Yann E. MORIN"
|
r15147 | elif status == 'ignored': | ||
Matt Mackall
|
r15404 | return repo.revs(ignored) | ||
"Yann E. MORIN"
|
r15153 | elif status == "goods": | ||
Matt Mackall
|
r15404 | return repo.revs(goods) | ||
"Yann E. MORIN"
|
r15153 | elif status == "bads": | ||
Matt Mackall
|
r15404 | return repo.revs(bads) | ||
"Yann E. MORIN"
|
r15136 | else: | ||
raise error.ParseError(_('invalid bisect state')) | ||||
"Yann E. MORIN"
|
r15154 | |||
"Yann E. MORIN"
|
r15406 | def label(repo, node): | ||
"Yann E. MORIN"
|
r15154 | rev = repo.changelog.rev(node) | ||
# Try explicit sets | ||||
if rev in get(repo, 'good'): | ||||
Wagner Bruna
|
r15308 | # i18n: bisect changeset status | ||
"Yann E. MORIN"
|
r15154 | return _('good') | ||
if rev in get(repo, 'bad'): | ||||
Wagner Bruna
|
r15308 | # i18n: bisect changeset status | ||
"Yann E. MORIN"
|
r15154 | return _('bad') | ||
if rev in get(repo, 'skip'): | ||||
Wagner Bruna
|
r15308 | # i18n: bisect changeset status | ||
"Yann E. MORIN"
|
r15154 | return _('skipped') | ||
Bryan O'Sullivan
|
r16647 | if rev in get(repo, 'untested') or rev in get(repo, 'current'): | ||
Wagner Bruna
|
r15308 | # i18n: bisect changeset status | ||
"Yann E. MORIN"
|
r15154 | return _('untested') | ||
if rev in get(repo, 'ignored'): | ||||
Wagner Bruna
|
r15308 | # i18n: bisect changeset status | ||
"Yann E. MORIN"
|
r15154 | return _('ignored') | ||
# Try implicit sets | ||||
if rev in get(repo, 'goods'): | ||||
Wagner Bruna
|
r15308 | # i18n: bisect changeset status | ||
"Yann E. MORIN"
|
r15154 | return _('good (implicit)') | ||
if rev in get(repo, 'bads'): | ||||
Wagner Bruna
|
r15308 | # i18n: bisect changeset status | ||
"Yann E. MORIN"
|
r15154 | return _('bad (implicit)') | ||
return None | ||||
def shortlabel(label): | ||||
if label: | ||||
return label[0].upper() | ||||
return None | ||||