revlog: split functionality related to deltas computation in a new module...
Boris Feld
r39366:655b5b46 default
@@ -1,3361 +1,3365 b''
1 # debugcommands.py - command processing for debug* commands
1 # debugcommands.py - command processing for debug* commands
2 #
2 #
3 # Copyright 2005-2016 Matt Mackall <mpm@selenic.com>
3 # Copyright 2005-2016 Matt Mackall <mpm@selenic.com>
4 #
4 #
5 # This software may be used and distributed according to the terms of the
5 # This software may be used and distributed according to the terms of the
6 # GNU General Public License version 2 or any later version.
6 # GNU General Public License version 2 or any later version.
7
7
8 from __future__ import absolute_import
8 from __future__ import absolute_import
9
9
10 import codecs
10 import codecs
11 import collections
11 import collections
12 import difflib
12 import difflib
13 import errno
13 import errno
14 import operator
14 import operator
15 import os
15 import os
16 import random
16 import random
17 import re
17 import re
18 import socket
18 import socket
19 import ssl
19 import ssl
20 import stat
20 import stat
21 import string
21 import string
22 import subprocess
22 import subprocess
23 import sys
23 import sys
24 import time
24 import time
25
25
26 from .i18n import _
26 from .i18n import _
27 from .node import (
27 from .node import (
28 bin,
28 bin,
29 hex,
29 hex,
30 nullhex,
30 nullhex,
31 nullid,
31 nullid,
32 nullrev,
32 nullrev,
33 short,
33 short,
34 )
34 )
35 from .thirdparty import (
35 from .thirdparty import (
36 cbor,
36 cbor,
37 )
37 )
38 from . import (
38 from . import (
39 bundle2,
39 bundle2,
40 changegroup,
40 changegroup,
41 cmdutil,
41 cmdutil,
42 color,
42 color,
43 context,
43 context,
44 dagparser,
44 dagparser,
45 encoding,
45 encoding,
46 error,
46 error,
47 exchange,
47 exchange,
48 extensions,
48 extensions,
49 filemerge,
49 filemerge,
50 filesetlang,
50 filesetlang,
51 formatter,
51 formatter,
52 hg,
52 hg,
53 httppeer,
53 httppeer,
54 localrepo,
54 localrepo,
55 lock as lockmod,
55 lock as lockmod,
56 logcmdutil,
56 logcmdutil,
57 merge as mergemod,
57 merge as mergemod,
58 obsolete,
58 obsolete,
59 obsutil,
59 obsutil,
60 phases,
60 phases,
61 policy,
61 policy,
62 pvec,
62 pvec,
63 pycompat,
63 pycompat,
64 registrar,
64 registrar,
65 repair,
65 repair,
66 revlog,
66 revlog,
67 revset,
67 revset,
68 revsetlang,
68 revsetlang,
69 scmutil,
69 scmutil,
70 setdiscovery,
70 setdiscovery,
71 simplemerge,
71 simplemerge,
72 sshpeer,
72 sshpeer,
73 sslutil,
73 sslutil,
74 streamclone,
74 streamclone,
75 templater,
75 templater,
76 treediscovery,
76 treediscovery,
77 upgrade,
77 upgrade,
78 url as urlmod,
78 url as urlmod,
79 util,
79 util,
80 vfs as vfsmod,
80 vfs as vfsmod,
81 wireprotoframing,
81 wireprotoframing,
82 wireprotoserver,
82 wireprotoserver,
83 wireprotov2peer,
83 wireprotov2peer,
84 )
84 )
85 from .utils import (
85 from .utils import (
86 dateutil,
86 dateutil,
87 procutil,
87 procutil,
88 stringutil,
88 stringutil,
89 )
89 )
90
90
91 from .revlogutils import (
92 deltas as deltautil
93 )
94
91 release = lockmod.release
95 release = lockmod.release
92
96
93 command = registrar.command()
97 command = registrar.command()
94
98
95 @command('debugancestor', [], _('[INDEX] REV1 REV2'), optionalrepo=True)
99 @command('debugancestor', [], _('[INDEX] REV1 REV2'), optionalrepo=True)
96 def debugancestor(ui, repo, *args):
100 def debugancestor(ui, repo, *args):
97 """find the ancestor revision of two revisions in a given index"""
101 """find the ancestor revision of two revisions in a given index"""
98 if len(args) == 3:
102 if len(args) == 3:
99 index, rev1, rev2 = args
103 index, rev1, rev2 = args
100 r = revlog.revlog(vfsmod.vfs(pycompat.getcwd(), audit=False), index)
104 r = revlog.revlog(vfsmod.vfs(pycompat.getcwd(), audit=False), index)
101 lookup = r.lookup
105 lookup = r.lookup
102 elif len(args) == 2:
106 elif len(args) == 2:
103 if not repo:
107 if not repo:
104 raise error.Abort(_('there is no Mercurial repository here '
108 raise error.Abort(_('there is no Mercurial repository here '
105 '(.hg not found)'))
109 '(.hg not found)'))
106 rev1, rev2 = args
110 rev1, rev2 = args
107 r = repo.changelog
111 r = repo.changelog
108 lookup = repo.lookup
112 lookup = repo.lookup
109 else:
113 else:
110 raise error.Abort(_('either two or three arguments required'))
114 raise error.Abort(_('either two or three arguments required'))
111 a = r.ancestor(lookup(rev1), lookup(rev2))
115 a = r.ancestor(lookup(rev1), lookup(rev2))
112 ui.write('%d:%s\n' % (r.rev(a), hex(a)))
116 ui.write('%d:%s\n' % (r.rev(a), hex(a)))
113
117
114 @command('debugapplystreamclonebundle', [], 'FILE')
118 @command('debugapplystreamclonebundle', [], 'FILE')
115 def debugapplystreamclonebundle(ui, repo, fname):
119 def debugapplystreamclonebundle(ui, repo, fname):
116 """apply a stream clone bundle file"""
120 """apply a stream clone bundle file"""
117 f = hg.openpath(ui, fname)
121 f = hg.openpath(ui, fname)
118 gen = exchange.readbundle(ui, f, fname)
122 gen = exchange.readbundle(ui, f, fname)
119 gen.apply(repo)
123 gen.apply(repo)
120
124
121 @command('debugbuilddag',
125 @command('debugbuilddag',
122 [('m', 'mergeable-file', None, _('add single file mergeable changes')),
126 [('m', 'mergeable-file', None, _('add single file mergeable changes')),
123 ('o', 'overwritten-file', None, _('add single file all revs overwrite')),
127 ('o', 'overwritten-file', None, _('add single file all revs overwrite')),
124 ('n', 'new-file', None, _('add new file at each rev'))],
128 ('n', 'new-file', None, _('add new file at each rev'))],
125 _('[OPTION]... [TEXT]'))
129 _('[OPTION]... [TEXT]'))
126 def debugbuilddag(ui, repo, text=None,
130 def debugbuilddag(ui, repo, text=None,
127 mergeable_file=False,
131 mergeable_file=False,
128 overwritten_file=False,
132 overwritten_file=False,
129 new_file=False):
133 new_file=False):
130 """builds a repo with a given DAG from scratch in the current empty repo
134 """builds a repo with a given DAG from scratch in the current empty repo
131
135
132 The description of the DAG is read from stdin if not given on the
136 The description of the DAG is read from stdin if not given on the
133 command line.
137 command line.
134
138
135 Elements:
139 Elements:
136
140
137 - "+n" is a linear run of n nodes based on the current default parent
141 - "+n" is a linear run of n nodes based on the current default parent
138 - "." is a single node based on the current default parent
142 - "." is a single node based on the current default parent
139 - "$" resets the default parent to null (implied at the start);
143 - "$" resets the default parent to null (implied at the start);
140 otherwise the default parent is always the last node created
144 otherwise the default parent is always the last node created
141 - "<p" sets the default parent to the backref p
145 - "<p" sets the default parent to the backref p
142 - "*p" is a fork at parent p, which is a backref
146 - "*p" is a fork at parent p, which is a backref
143 - "*p1/p2" is a merge of parents p1 and p2, which are backrefs
147 - "*p1/p2" is a merge of parents p1 and p2, which are backrefs
144 - "/p2" is a merge of the preceding node and p2
148 - "/p2" is a merge of the preceding node and p2
145 - ":tag" defines a local tag for the preceding node
149 - ":tag" defines a local tag for the preceding node
146 - "@branch" sets the named branch for subsequent nodes
150 - "@branch" sets the named branch for subsequent nodes
147 - "#...\\n" is a comment up to the end of the line
151 - "#...\\n" is a comment up to the end of the line
148
152
149 Whitespace between the above elements is ignored.
153 Whitespace between the above elements is ignored.
150
154
151 A backref is either
155 A backref is either
152
156
153 - a number n, which references the node curr-n, where curr is the current
157 - a number n, which references the node curr-n, where curr is the current
154 node, or
158 node, or
155 - the name of a local tag you placed earlier using ":tag", or
159 - the name of a local tag you placed earlier using ":tag", or
156 - empty to denote the default parent.
160 - empty to denote the default parent.
157
161
158 All string valued-elements are either strictly alphanumeric, or must
162 All string valued-elements are either strictly alphanumeric, or must
159 be enclosed in double quotes ("..."), with "\\" as escape character.
163 be enclosed in double quotes ("..."), with "\\" as escape character.
160 """
164 """
161
165
162 if text is None:
166 if text is None:
163 ui.status(_("reading DAG from stdin\n"))
167 ui.status(_("reading DAG from stdin\n"))
164 text = ui.fin.read()
168 text = ui.fin.read()
165
169
166 cl = repo.changelog
170 cl = repo.changelog
167 if len(cl) > 0:
171 if len(cl) > 0:
168 raise error.Abort(_('repository is not empty'))
172 raise error.Abort(_('repository is not empty'))
169
173
170 # determine number of revs in DAG
174 # determine number of revs in DAG
171 total = 0
175 total = 0
172 for type, data in dagparser.parsedag(text):
176 for type, data in dagparser.parsedag(text):
173 if type == 'n':
177 if type == 'n':
174 total += 1
178 total += 1
175
179
176 if mergeable_file:
180 if mergeable_file:
177 linesperrev = 2
181 linesperrev = 2
178 # make a file with k lines per rev
182 # make a file with k lines per rev
179 initialmergedlines = ['%d' % i
183 initialmergedlines = ['%d' % i
180 for i in pycompat.xrange(0, total * linesperrev)]
184 for i in pycompat.xrange(0, total * linesperrev)]
181 initialmergedlines.append("")
185 initialmergedlines.append("")
182
186
183 tags = []
187 tags = []
184 progress = ui.makeprogress(_('building'), unit=_('revisions'),
188 progress = ui.makeprogress(_('building'), unit=_('revisions'),
185 total=total)
189 total=total)
186 with progress, repo.wlock(), repo.lock(), repo.transaction("builddag"):
190 with progress, repo.wlock(), repo.lock(), repo.transaction("builddag"):
187 at = -1
191 at = -1
188 atbranch = 'default'
192 atbranch = 'default'
189 nodeids = []
193 nodeids = []
190 id = 0
194 id = 0
191 progress.update(id)
195 progress.update(id)
192 for type, data in dagparser.parsedag(text):
196 for type, data in dagparser.parsedag(text):
193 if type == 'n':
197 if type == 'n':
194 ui.note(('node %s\n' % pycompat.bytestr(data)))
198 ui.note(('node %s\n' % pycompat.bytestr(data)))
195 id, ps = data
199 id, ps = data
196
200
197 files = []
201 files = []
198 filecontent = {}
202 filecontent = {}
199
203
200 p2 = None
204 p2 = None
201 if mergeable_file:
205 if mergeable_file:
202 fn = "mf"
206 fn = "mf"
203 p1 = repo[ps[0]]
207 p1 = repo[ps[0]]
204 if len(ps) > 1:
208 if len(ps) > 1:
205 p2 = repo[ps[1]]
209 p2 = repo[ps[1]]
206 pa = p1.ancestor(p2)
210 pa = p1.ancestor(p2)
207 base, local, other = [x[fn].data() for x in (pa, p1,
211 base, local, other = [x[fn].data() for x in (pa, p1,
208 p2)]
212 p2)]
209 m3 = simplemerge.Merge3Text(base, local, other)
213 m3 = simplemerge.Merge3Text(base, local, other)
210 ml = [l.strip() for l in m3.merge_lines()]
214 ml = [l.strip() for l in m3.merge_lines()]
211 ml.append("")
215 ml.append("")
212 elif at > 0:
216 elif at > 0:
213 ml = p1[fn].data().split("\n")
217 ml = p1[fn].data().split("\n")
214 else:
218 else:
215 ml = initialmergedlines
219 ml = initialmergedlines
216 ml[id * linesperrev] += " r%i" % id
220 ml[id * linesperrev] += " r%i" % id
217 mergedtext = "\n".join(ml)
221 mergedtext = "\n".join(ml)
218 files.append(fn)
222 files.append(fn)
219 filecontent[fn] = mergedtext
223 filecontent[fn] = mergedtext
220
224
221 if overwritten_file:
225 if overwritten_file:
222 fn = "of"
226 fn = "of"
223 files.append(fn)
227 files.append(fn)
224 filecontent[fn] = "r%i\n" % id
228 filecontent[fn] = "r%i\n" % id
225
229
226 if new_file:
230 if new_file:
227 fn = "nf%i" % id
231 fn = "nf%i" % id
228 files.append(fn)
232 files.append(fn)
229 filecontent[fn] = "r%i\n" % id
233 filecontent[fn] = "r%i\n" % id
230 if len(ps) > 1:
234 if len(ps) > 1:
231 if not p2:
235 if not p2:
232 p2 = repo[ps[1]]
236 p2 = repo[ps[1]]
233 for fn in p2:
237 for fn in p2:
234 if fn.startswith("nf"):
238 if fn.startswith("nf"):
235 files.append(fn)
239 files.append(fn)
236 filecontent[fn] = p2[fn].data()
240 filecontent[fn] = p2[fn].data()
237
241
238 def fctxfn(repo, cx, path):
242 def fctxfn(repo, cx, path):
239 if path in filecontent:
243 if path in filecontent:
240 return context.memfilectx(repo, cx, path,
244 return context.memfilectx(repo, cx, path,
241 filecontent[path])
245 filecontent[path])
242 return None
246 return None
243
247
244 if len(ps) == 0 or ps[0] < 0:
248 if len(ps) == 0 or ps[0] < 0:
245 pars = [None, None]
249 pars = [None, None]
246 elif len(ps) == 1:
250 elif len(ps) == 1:
247 pars = [nodeids[ps[0]], None]
251 pars = [nodeids[ps[0]], None]
248 else:
252 else:
249 pars = [nodeids[p] for p in ps]
253 pars = [nodeids[p] for p in ps]
250 cx = context.memctx(repo, pars, "r%i" % id, files, fctxfn,
254 cx = context.memctx(repo, pars, "r%i" % id, files, fctxfn,
251 date=(id, 0),
255 date=(id, 0),
252 user="debugbuilddag",
256 user="debugbuilddag",
253 extra={'branch': atbranch})
257 extra={'branch': atbranch})
254 nodeid = repo.commitctx(cx)
258 nodeid = repo.commitctx(cx)
255 nodeids.append(nodeid)
259 nodeids.append(nodeid)
256 at = id
260 at = id
257 elif type == 'l':
261 elif type == 'l':
258 id, name = data
262 id, name = data
259 ui.note(('tag %s\n' % name))
263 ui.note(('tag %s\n' % name))
260 tags.append("%s %s\n" % (hex(repo.changelog.node(id)), name))
264 tags.append("%s %s\n" % (hex(repo.changelog.node(id)), name))
261 elif type == 'a':
265 elif type == 'a':
262 ui.note(('branch %s\n' % data))
266 ui.note(('branch %s\n' % data))
263 atbranch = data
267 atbranch = data
264 progress.update(id)
268 progress.update(id)
265
269
266 if tags:
270 if tags:
267 repo.vfs.write("localtags", "".join(tags))
271 repo.vfs.write("localtags", "".join(tags))
268
272
269 def _debugchangegroup(ui, gen, all=None, indent=0, **opts):
273 def _debugchangegroup(ui, gen, all=None, indent=0, **opts):
270 indent_string = ' ' * indent
274 indent_string = ' ' * indent
271 if all:
275 if all:
272 ui.write(("%sformat: id, p1, p2, cset, delta base, len(delta)\n")
276 ui.write(("%sformat: id, p1, p2, cset, delta base, len(delta)\n")
273 % indent_string)
277 % indent_string)
274
278
275 def showchunks(named):
279 def showchunks(named):
276 ui.write("\n%s%s\n" % (indent_string, named))
280 ui.write("\n%s%s\n" % (indent_string, named))
277 for deltadata in gen.deltaiter():
281 for deltadata in gen.deltaiter():
278 node, p1, p2, cs, deltabase, delta, flags = deltadata
282 node, p1, p2, cs, deltabase, delta, flags = deltadata
279 ui.write("%s%s %s %s %s %s %d\n" %
283 ui.write("%s%s %s %s %s %s %d\n" %
280 (indent_string, hex(node), hex(p1), hex(p2),
284 (indent_string, hex(node), hex(p1), hex(p2),
281 hex(cs), hex(deltabase), len(delta)))
285 hex(cs), hex(deltabase), len(delta)))
282
286
283 chunkdata = gen.changelogheader()
287 chunkdata = gen.changelogheader()
284 showchunks("changelog")
288 showchunks("changelog")
285 chunkdata = gen.manifestheader()
289 chunkdata = gen.manifestheader()
286 showchunks("manifest")
290 showchunks("manifest")
287 for chunkdata in iter(gen.filelogheader, {}):
291 for chunkdata in iter(gen.filelogheader, {}):
288 fname = chunkdata['filename']
292 fname = chunkdata['filename']
289 showchunks(fname)
293 showchunks(fname)
290 else:
294 else:
291 if isinstance(gen, bundle2.unbundle20):
295 if isinstance(gen, bundle2.unbundle20):
292 raise error.Abort(_('use debugbundle2 for this file'))
296 raise error.Abort(_('use debugbundle2 for this file'))
293 chunkdata = gen.changelogheader()
297 chunkdata = gen.changelogheader()
294 for deltadata in gen.deltaiter():
298 for deltadata in gen.deltaiter():
295 node, p1, p2, cs, deltabase, delta, flags = deltadata
299 node, p1, p2, cs, deltabase, delta, flags = deltadata
296 ui.write("%s%s\n" % (indent_string, hex(node)))
300 ui.write("%s%s\n" % (indent_string, hex(node)))
297
301
298 def _debugobsmarkers(ui, part, indent=0, **opts):
302 def _debugobsmarkers(ui, part, indent=0, **opts):
299 """display version and markers contained in 'data'"""
303 """display version and markers contained in 'data'"""
300 opts = pycompat.byteskwargs(opts)
304 opts = pycompat.byteskwargs(opts)
301 data = part.read()
305 data = part.read()
302 indent_string = ' ' * indent
306 indent_string = ' ' * indent
303 try:
307 try:
304 version, markers = obsolete._readmarkers(data)
308 version, markers = obsolete._readmarkers(data)
305 except error.UnknownVersion as exc:
309 except error.UnknownVersion as exc:
306 msg = "%sunsupported version: %s (%d bytes)\n"
310 msg = "%sunsupported version: %s (%d bytes)\n"
307 msg %= indent_string, exc.version, len(data)
311 msg %= indent_string, exc.version, len(data)
308 ui.write(msg)
312 ui.write(msg)
309 else:
313 else:
310 msg = "%sversion: %d (%d bytes)\n"
314 msg = "%sversion: %d (%d bytes)\n"
311 msg %= indent_string, version, len(data)
315 msg %= indent_string, version, len(data)
312 ui.write(msg)
316 ui.write(msg)
313 fm = ui.formatter('debugobsolete', opts)
317 fm = ui.formatter('debugobsolete', opts)
314 for rawmarker in sorted(markers):
318 for rawmarker in sorted(markers):
315 m = obsutil.marker(None, rawmarker)
319 m = obsutil.marker(None, rawmarker)
316 fm.startitem()
320 fm.startitem()
317 fm.plain(indent_string)
321 fm.plain(indent_string)
318 cmdutil.showmarker(fm, m)
322 cmdutil.showmarker(fm, m)
319 fm.end()
323 fm.end()
320
324
321 def _debugphaseheads(ui, data, indent=0):
325 def _debugphaseheads(ui, data, indent=0):
322 """display version and markers contained in 'data'"""
326 """display version and markers contained in 'data'"""
323 indent_string = ' ' * indent
327 indent_string = ' ' * indent
324 headsbyphase = phases.binarydecode(data)
328 headsbyphase = phases.binarydecode(data)
325 for phase in phases.allphases:
329 for phase in phases.allphases:
326 for head in headsbyphase[phase]:
330 for head in headsbyphase[phase]:
327 ui.write(indent_string)
331 ui.write(indent_string)
328 ui.write('%s %s\n' % (hex(head), phases.phasenames[phase]))
332 ui.write('%s %s\n' % (hex(head), phases.phasenames[phase]))
329
333
330 def _quasirepr(thing):
334 def _quasirepr(thing):
331 if isinstance(thing, (dict, util.sortdict, collections.OrderedDict)):
335 if isinstance(thing, (dict, util.sortdict, collections.OrderedDict)):
332 return '{%s}' % (
336 return '{%s}' % (
333 b', '.join(b'%s: %s' % (k, thing[k]) for k in sorted(thing)))
337 b', '.join(b'%s: %s' % (k, thing[k]) for k in sorted(thing)))
334 return pycompat.bytestr(repr(thing))
338 return pycompat.bytestr(repr(thing))
335
339
336 def _debugbundle2(ui, gen, all=None, **opts):
340 def _debugbundle2(ui, gen, all=None, **opts):
337 """lists the contents of a bundle2"""
341 """lists the contents of a bundle2"""
338 if not isinstance(gen, bundle2.unbundle20):
342 if not isinstance(gen, bundle2.unbundle20):
339 raise error.Abort(_('not a bundle2 file'))
343 raise error.Abort(_('not a bundle2 file'))
340 ui.write(('Stream params: %s\n' % _quasirepr(gen.params)))
344 ui.write(('Stream params: %s\n' % _quasirepr(gen.params)))
341 parttypes = opts.get(r'part_type', [])
345 parttypes = opts.get(r'part_type', [])
342 for part in gen.iterparts():
346 for part in gen.iterparts():
343 if parttypes and part.type not in parttypes:
347 if parttypes and part.type not in parttypes:
344 continue
348 continue
345 msg = '%s -- %s (mandatory: %r)\n'
349 msg = '%s -- %s (mandatory: %r)\n'
346 ui.write((msg % (part.type, _quasirepr(part.params), part.mandatory)))
350 ui.write((msg % (part.type, _quasirepr(part.params), part.mandatory)))
347 if part.type == 'changegroup':
351 if part.type == 'changegroup':
348 version = part.params.get('version', '01')
352 version = part.params.get('version', '01')
349 cg = changegroup.getunbundler(version, part, 'UN')
353 cg = changegroup.getunbundler(version, part, 'UN')
350 if not ui.quiet:
354 if not ui.quiet:
351 _debugchangegroup(ui, cg, all=all, indent=4, **opts)
355 _debugchangegroup(ui, cg, all=all, indent=4, **opts)
352 if part.type == 'obsmarkers':
356 if part.type == 'obsmarkers':
353 if not ui.quiet:
357 if not ui.quiet:
354 _debugobsmarkers(ui, part, indent=4, **opts)
358 _debugobsmarkers(ui, part, indent=4, **opts)
355 if part.type == 'phase-heads':
359 if part.type == 'phase-heads':
356 if not ui.quiet:
360 if not ui.quiet:
357 _debugphaseheads(ui, part, indent=4)
361 _debugphaseheads(ui, part, indent=4)
358
362
359 @command('debugbundle',
363 @command('debugbundle',
360 [('a', 'all', None, _('show all details')),
364 [('a', 'all', None, _('show all details')),
361 ('', 'part-type', [], _('show only the named part type')),
365 ('', 'part-type', [], _('show only the named part type')),
362 ('', 'spec', None, _('print the bundlespec of the bundle'))],
366 ('', 'spec', None, _('print the bundlespec of the bundle'))],
363 _('FILE'),
367 _('FILE'),
364 norepo=True)
368 norepo=True)
365 def debugbundle(ui, bundlepath, all=None, spec=None, **opts):
369 def debugbundle(ui, bundlepath, all=None, spec=None, **opts):
366 """lists the contents of a bundle"""
370 """lists the contents of a bundle"""
367 with hg.openpath(ui, bundlepath) as f:
371 with hg.openpath(ui, bundlepath) as f:
368 if spec:
372 if spec:
369 spec = exchange.getbundlespec(ui, f)
373 spec = exchange.getbundlespec(ui, f)
370 ui.write('%s\n' % spec)
374 ui.write('%s\n' % spec)
371 return
375 return
372
376
373 gen = exchange.readbundle(ui, f, bundlepath)
377 gen = exchange.readbundle(ui, f, bundlepath)
374 if isinstance(gen, bundle2.unbundle20):
378 if isinstance(gen, bundle2.unbundle20):
375 return _debugbundle2(ui, gen, all=all, **opts)
379 return _debugbundle2(ui, gen, all=all, **opts)
376 _debugchangegroup(ui, gen, all=all, **opts)
380 _debugchangegroup(ui, gen, all=all, **opts)
377
381
378 @command('debugcapabilities',
382 @command('debugcapabilities',
379 [], _('PATH'),
383 [], _('PATH'),
380 norepo=True)
384 norepo=True)
381 def debugcapabilities(ui, path, **opts):
385 def debugcapabilities(ui, path, **opts):
382 """lists the capabilities of a remote peer"""
386 """lists the capabilities of a remote peer"""
383 opts = pycompat.byteskwargs(opts)
387 opts = pycompat.byteskwargs(opts)
384 peer = hg.peer(ui, opts, path)
388 peer = hg.peer(ui, opts, path)
385 caps = peer.capabilities()
389 caps = peer.capabilities()
386 ui.write(('Main capabilities:\n'))
390 ui.write(('Main capabilities:\n'))
387 for c in sorted(caps):
391 for c in sorted(caps):
388 ui.write((' %s\n') % c)
392 ui.write((' %s\n') % c)
389 b2caps = bundle2.bundle2caps(peer)
393 b2caps = bundle2.bundle2caps(peer)
390 if b2caps:
394 if b2caps:
391 ui.write(('Bundle2 capabilities:\n'))
395 ui.write(('Bundle2 capabilities:\n'))
392 for key, values in sorted(b2caps.iteritems()):
396 for key, values in sorted(b2caps.iteritems()):
393 ui.write((' %s\n') % key)
397 ui.write((' %s\n') % key)
394 for v in values:
398 for v in values:
395 ui.write((' %s\n') % v)
399 ui.write((' %s\n') % v)
396
400
397 @command('debugcheckstate', [], '')
401 @command('debugcheckstate', [], '')
398 def debugcheckstate(ui, repo):
402 def debugcheckstate(ui, repo):
399 """validate the correctness of the current dirstate"""
403 """validate the correctness of the current dirstate"""
400 parent1, parent2 = repo.dirstate.parents()
404 parent1, parent2 = repo.dirstate.parents()
401 m1 = repo[parent1].manifest()
405 m1 = repo[parent1].manifest()
402 m2 = repo[parent2].manifest()
406 m2 = repo[parent2].manifest()
403 errors = 0
407 errors = 0
404 for f in repo.dirstate:
408 for f in repo.dirstate:
405 state = repo.dirstate[f]
409 state = repo.dirstate[f]
406 if state in "nr" and f not in m1:
410 if state in "nr" and f not in m1:
407 ui.warn(_("%s in state %s, but not in manifest1\n") % (f, state))
411 ui.warn(_("%s in state %s, but not in manifest1\n") % (f, state))
408 errors += 1
412 errors += 1
409 if state in "a" and f in m1:
413 if state in "a" and f in m1:
410 ui.warn(_("%s in state %s, but also in manifest1\n") % (f, state))
414 ui.warn(_("%s in state %s, but also in manifest1\n") % (f, state))
411 errors += 1
415 errors += 1
412 if state in "m" and f not in m1 and f not in m2:
416 if state in "m" and f not in m1 and f not in m2:
413 ui.warn(_("%s in state %s, but not in either manifest\n") %
417 ui.warn(_("%s in state %s, but not in either manifest\n") %
414 (f, state))
418 (f, state))
415 errors += 1
419 errors += 1
416 for f in m1:
420 for f in m1:
417 state = repo.dirstate[f]
421 state = repo.dirstate[f]
418 if state not in "nrm":
422 if state not in "nrm":
419 ui.warn(_("%s in manifest1, but listed as state %s") % (f, state))
423 ui.warn(_("%s in manifest1, but listed as state %s") % (f, state))
420 errors += 1
424 errors += 1
421 if errors:
425 if errors:
422 error = _(".hg/dirstate inconsistent with current parent's manifest")
426 error = _(".hg/dirstate inconsistent with current parent's manifest")
423 raise error.Abort(error)
427 raise error.Abort(error)
424
428
425 @command('debugcolor',
429 @command('debugcolor',
426 [('', 'style', None, _('show all configured styles'))],
430 [('', 'style', None, _('show all configured styles'))],
427 'hg debugcolor')
431 'hg debugcolor')
428 def debugcolor(ui, repo, **opts):
432 def debugcolor(ui, repo, **opts):
429 """show available color, effects or style"""
433 """show available color, effects or style"""
430 ui.write(('color mode: %s\n') % stringutil.pprint(ui._colormode))
434 ui.write(('color mode: %s\n') % stringutil.pprint(ui._colormode))
431 if opts.get(r'style'):
435 if opts.get(r'style'):
432 return _debugdisplaystyle(ui)
436 return _debugdisplaystyle(ui)
433 else:
437 else:
434 return _debugdisplaycolor(ui)
438 return _debugdisplaycolor(ui)
435
439
436 def _debugdisplaycolor(ui):
440 def _debugdisplaycolor(ui):
437 ui = ui.copy()
441 ui = ui.copy()
438 ui._styles.clear()
442 ui._styles.clear()
439 for effect in color._activeeffects(ui).keys():
443 for effect in color._activeeffects(ui).keys():
440 ui._styles[effect] = effect
444 ui._styles[effect] = effect
441 if ui._terminfoparams:
445 if ui._terminfoparams:
442 for k, v in ui.configitems('color'):
446 for k, v in ui.configitems('color'):
443 if k.startswith('color.'):
447 if k.startswith('color.'):
444 ui._styles[k] = k[6:]
448 ui._styles[k] = k[6:]
445 elif k.startswith('terminfo.'):
449 elif k.startswith('terminfo.'):
446 ui._styles[k] = k[9:]
450 ui._styles[k] = k[9:]
447 ui.write(_('available colors:\n'))
451 ui.write(_('available colors:\n'))
448 # sort label with a '_' after the other to group '_background' entry.
452 # sort label with a '_' after the other to group '_background' entry.
449 items = sorted(ui._styles.items(),
453 items = sorted(ui._styles.items(),
450 key=lambda i: ('_' in i[0], i[0], i[1]))
454 key=lambda i: ('_' in i[0], i[0], i[1]))
451 for colorname, label in items:
455 for colorname, label in items:
452 ui.write(('%s\n') % colorname, label=label)
456 ui.write(('%s\n') % colorname, label=label)
453
457
454 def _debugdisplaystyle(ui):
458 def _debugdisplaystyle(ui):
455 ui.write(_('available style:\n'))
459 ui.write(_('available style:\n'))
456 if not ui._styles:
460 if not ui._styles:
457 return
461 return
458 width = max(len(s) for s in ui._styles)
462 width = max(len(s) for s in ui._styles)
459 for label, effects in sorted(ui._styles.items()):
463 for label, effects in sorted(ui._styles.items()):
460 ui.write('%s' % label, label=label)
464 ui.write('%s' % label, label=label)
461 if effects:
465 if effects:
462 # 50
466 # 50
463 ui.write(': ')
467 ui.write(': ')
464 ui.write(' ' * (max(0, width - len(label))))
468 ui.write(' ' * (max(0, width - len(label))))
465 ui.write(', '.join(ui.label(e, e) for e in effects.split()))
469 ui.write(', '.join(ui.label(e, e) for e in effects.split()))
466 ui.write('\n')
470 ui.write('\n')
467
471
468 @command('debugcreatestreamclonebundle', [], 'FILE')
472 @command('debugcreatestreamclonebundle', [], 'FILE')
469 def debugcreatestreamclonebundle(ui, repo, fname):
473 def debugcreatestreamclonebundle(ui, repo, fname):
470 """create a stream clone bundle file
474 """create a stream clone bundle file
471
475
472 Stream bundles are special bundles that are essentially archives of
476 Stream bundles are special bundles that are essentially archives of
473 revlog files. They are commonly used for cloning very quickly.
477 revlog files. They are commonly used for cloning very quickly.
474 """
478 """
475 # TODO we may want to turn this into an abort when this functionality
479 # TODO we may want to turn this into an abort when this functionality
476 # is moved into `hg bundle`.
480 # is moved into `hg bundle`.
477 if phases.hassecret(repo):
481 if phases.hassecret(repo):
478 ui.warn(_('(warning: stream clone bundle will contain secret '
482 ui.warn(_('(warning: stream clone bundle will contain secret '
479 'revisions)\n'))
483 'revisions)\n'))
480
484
481 requirements, gen = streamclone.generatebundlev1(repo)
485 requirements, gen = streamclone.generatebundlev1(repo)
482 changegroup.writechunks(ui, gen, fname)
486 changegroup.writechunks(ui, gen, fname)
483
487
484 ui.write(_('bundle requirements: %s\n') % ', '.join(sorted(requirements)))
488 ui.write(_('bundle requirements: %s\n') % ', '.join(sorted(requirements)))
485
489
486 @command('debugdag',
490 @command('debugdag',
487 [('t', 'tags', None, _('use tags as labels')),
491 [('t', 'tags', None, _('use tags as labels')),
488 ('b', 'branches', None, _('annotate with branch names')),
492 ('b', 'branches', None, _('annotate with branch names')),
489 ('', 'dots', None, _('use dots for runs')),
493 ('', 'dots', None, _('use dots for runs')),
490 ('s', 'spaces', None, _('separate elements by spaces'))],
494 ('s', 'spaces', None, _('separate elements by spaces'))],
491 _('[OPTION]... [FILE [REV]...]'),
495 _('[OPTION]... [FILE [REV]...]'),
492 optionalrepo=True)
496 optionalrepo=True)
493 def debugdag(ui, repo, file_=None, *revs, **opts):
497 def debugdag(ui, repo, file_=None, *revs, **opts):
494 """format the changelog or an index DAG as a concise textual description
498 """format the changelog or an index DAG as a concise textual description
495
499
496 If you pass a revlog index, the revlog's DAG is emitted. If you list
500 If you pass a revlog index, the revlog's DAG is emitted. If you list
497 revision numbers, they get labeled in the output as rN.
501 revision numbers, they get labeled in the output as rN.
498
502
499 Otherwise, the changelog DAG of the current repo is emitted.
503 Otherwise, the changelog DAG of the current repo is emitted.
500 """
504 """
501 spaces = opts.get(r'spaces')
505 spaces = opts.get(r'spaces')
502 dots = opts.get(r'dots')
506 dots = opts.get(r'dots')
503 if file_:
507 if file_:
504 rlog = revlog.revlog(vfsmod.vfs(pycompat.getcwd(), audit=False),
508 rlog = revlog.revlog(vfsmod.vfs(pycompat.getcwd(), audit=False),
505 file_)
509 file_)
506 revs = set((int(r) for r in revs))
510 revs = set((int(r) for r in revs))
507 def events():
511 def events():
508 for r in rlog:
512 for r in rlog:
509 yield 'n', (r, list(p for p in rlog.parentrevs(r)
513 yield 'n', (r, list(p for p in rlog.parentrevs(r)
510 if p != -1))
514 if p != -1))
511 if r in revs:
515 if r in revs:
512 yield 'l', (r, "r%i" % r)
516 yield 'l', (r, "r%i" % r)
513 elif repo:
517 elif repo:
514 cl = repo.changelog
518 cl = repo.changelog
515 tags = opts.get(r'tags')
519 tags = opts.get(r'tags')
516 branches = opts.get(r'branches')
520 branches = opts.get(r'branches')
517 if tags:
521 if tags:
518 labels = {}
522 labels = {}
519 for l, n in repo.tags().items():
523 for l, n in repo.tags().items():
520 labels.setdefault(cl.rev(n), []).append(l)
524 labels.setdefault(cl.rev(n), []).append(l)
521 def events():
525 def events():
522 b = "default"
526 b = "default"
523 for r in cl:
527 for r in cl:
524 if branches:
528 if branches:
525 newb = cl.read(cl.node(r))[5]['branch']
529 newb = cl.read(cl.node(r))[5]['branch']
526 if newb != b:
530 if newb != b:
527 yield 'a', newb
531 yield 'a', newb
528 b = newb
532 b = newb
529 yield 'n', (r, list(p for p in cl.parentrevs(r)
533 yield 'n', (r, list(p for p in cl.parentrevs(r)
530 if p != -1))
534 if p != -1))
531 if tags:
535 if tags:
532 ls = labels.get(r)
536 ls = labels.get(r)
533 if ls:
537 if ls:
534 for l in ls:
538 for l in ls:
535 yield 'l', (r, l)
539 yield 'l', (r, l)
536 else:
540 else:
537 raise error.Abort(_('need repo for changelog dag'))
541 raise error.Abort(_('need repo for changelog dag'))
538
542
539 for line in dagparser.dagtextlines(events(),
543 for line in dagparser.dagtextlines(events(),
540 addspaces=spaces,
544 addspaces=spaces,
541 wraplabels=True,
545 wraplabels=True,
542 wrapannotations=True,
546 wrapannotations=True,
543 wrapnonlinear=dots,
547 wrapnonlinear=dots,
544 usedots=dots,
548 usedots=dots,
545 maxlinewidth=70):
549 maxlinewidth=70):
546 ui.write(line)
550 ui.write(line)
547 ui.write("\n")
551 ui.write("\n")
548
552
549 @command('debugdata', cmdutil.debugrevlogopts, _('-c|-m|FILE REV'))
553 @command('debugdata', cmdutil.debugrevlogopts, _('-c|-m|FILE REV'))
550 def debugdata(ui, repo, file_, rev=None, **opts):
554 def debugdata(ui, repo, file_, rev=None, **opts):
551 """dump the contents of a data file revision"""
555 """dump the contents of a data file revision"""
552 opts = pycompat.byteskwargs(opts)
556 opts = pycompat.byteskwargs(opts)
553 if opts.get('changelog') or opts.get('manifest') or opts.get('dir'):
557 if opts.get('changelog') or opts.get('manifest') or opts.get('dir'):
554 if rev is not None:
558 if rev is not None:
555 raise error.CommandError('debugdata', _('invalid arguments'))
559 raise error.CommandError('debugdata', _('invalid arguments'))
556 file_, rev = None, file_
560 file_, rev = None, file_
557 elif rev is None:
561 elif rev is None:
558 raise error.CommandError('debugdata', _('invalid arguments'))
562 raise error.CommandError('debugdata', _('invalid arguments'))
559 r = cmdutil.openstorage(repo, 'debugdata', file_, opts)
563 r = cmdutil.openstorage(repo, 'debugdata', file_, opts)
560 try:
564 try:
561 ui.write(r.revision(r.lookup(rev), raw=True))
565 ui.write(r.revision(r.lookup(rev), raw=True))
562 except KeyError:
566 except KeyError:
563 raise error.Abort(_('invalid revision identifier %s') % rev)
567 raise error.Abort(_('invalid revision identifier %s') % rev)
564
568
565 @command('debugdate',
569 @command('debugdate',
566 [('e', 'extended', None, _('try extended date formats'))],
570 [('e', 'extended', None, _('try extended date formats'))],
567 _('[-e] DATE [RANGE]'),
571 _('[-e] DATE [RANGE]'),
568 norepo=True, optionalrepo=True)
572 norepo=True, optionalrepo=True)
569 def debugdate(ui, date, range=None, **opts):
573 def debugdate(ui, date, range=None, **opts):
570 """parse and display a date"""
574 """parse and display a date"""
571 if opts[r"extended"]:
575 if opts[r"extended"]:
572 d = dateutil.parsedate(date, util.extendeddateformats)
576 d = dateutil.parsedate(date, util.extendeddateformats)
573 else:
577 else:
574 d = dateutil.parsedate(date)
578 d = dateutil.parsedate(date)
575 ui.write(("internal: %d %d\n") % d)
579 ui.write(("internal: %d %d\n") % d)
576 ui.write(("standard: %s\n") % dateutil.datestr(d))
580 ui.write(("standard: %s\n") % dateutil.datestr(d))
577 if range:
581 if range:
578 m = dateutil.matchdate(range)
582 m = dateutil.matchdate(range)
579 ui.write(("match: %s\n") % m(d[0]))
583 ui.write(("match: %s\n") % m(d[0]))
580
584
581 @command('debugdeltachain',
585 @command('debugdeltachain',
582 cmdutil.debugrevlogopts + cmdutil.formatteropts,
586 cmdutil.debugrevlogopts + cmdutil.formatteropts,
583 _('-c|-m|FILE'),
587 _('-c|-m|FILE'),
584 optionalrepo=True)
588 optionalrepo=True)
585 def debugdeltachain(ui, repo, file_=None, **opts):
589 def debugdeltachain(ui, repo, file_=None, **opts):
586 """dump information about delta chains in a revlog
590 """dump information about delta chains in a revlog
587
591
588 Output can be templatized. Available template keywords are:
592 Output can be templatized. Available template keywords are:
589
593
590 :``rev``: revision number
594 :``rev``: revision number
591 :``chainid``: delta chain identifier (numbered by unique base)
595 :``chainid``: delta chain identifier (numbered by unique base)
592 :``chainlen``: delta chain length to this revision
596 :``chainlen``: delta chain length to this revision
593 :``prevrev``: previous revision in delta chain
597 :``prevrev``: previous revision in delta chain
594 :``deltatype``: role of delta / how it was computed
598 :``deltatype``: role of delta / how it was computed
595 :``compsize``: compressed size of revision
599 :``compsize``: compressed size of revision
596 :``uncompsize``: uncompressed size of revision
600 :``uncompsize``: uncompressed size of revision
597 :``chainsize``: total size of compressed revisions in chain
601 :``chainsize``: total size of compressed revisions in chain
598 :``chainratio``: total chain size divided by uncompressed revision size
602 :``chainratio``: total chain size divided by uncompressed revision size
599 (new delta chains typically start at ratio 2.00)
603 (new delta chains typically start at ratio 2.00)
600 :``lindist``: linear distance from base revision in delta chain to end
604 :``lindist``: linear distance from base revision in delta chain to end
601 of this revision
605 of this revision
602 :``extradist``: total size of revisions not part of this delta chain from
606 :``extradist``: total size of revisions not part of this delta chain from
603 base of delta chain to end of this revision; a measurement
607 base of delta chain to end of this revision; a measurement
604 of how much extra data we need to read/seek across to read
608 of how much extra data we need to read/seek across to read
605 the delta chain for this revision
609 the delta chain for this revision
606 :``extraratio``: extradist divided by chainsize; another representation of
610 :``extraratio``: extradist divided by chainsize; another representation of
607 how much unrelated data is needed to load this delta chain
611 how much unrelated data is needed to load this delta chain
608
612
609 If the repository is configured to use the sparse read, additional keywords
613 If the repository is configured to use the sparse read, additional keywords
610 are available:
614 are available:
611
615
612 :``readsize``: total size of data read from the disk for a revision
616 :``readsize``: total size of data read from the disk for a revision
613 (sum of the sizes of all the blocks)
617 (sum of the sizes of all the blocks)
614 :``largestblock``: size of the largest block of data read from the disk
618 :``largestblock``: size of the largest block of data read from the disk
615 :``readdensity``: density of useful bytes in the data read from the disk
619 :``readdensity``: density of useful bytes in the data read from the disk
616 :``srchunks``: in how many data hunks the whole revision would be read
620 :``srchunks``: in how many data hunks the whole revision would be read
617
621
618 The sparse read can be enabled with experimental.sparse-read = True
622 The sparse read can be enabled with experimental.sparse-read = True
619 """
623 """
620 opts = pycompat.byteskwargs(opts)
624 opts = pycompat.byteskwargs(opts)
621 r = cmdutil.openrevlog(repo, 'debugdeltachain', file_, opts)
625 r = cmdutil.openrevlog(repo, 'debugdeltachain', file_, opts)
622 index = r.index
626 index = r.index
623 start = r.start
627 start = r.start
624 length = r.length
628 length = r.length
625 generaldelta = r.version & revlog.FLAG_GENERALDELTA
629 generaldelta = r.version & revlog.FLAG_GENERALDELTA
626 withsparseread = getattr(r, '_withsparseread', False)
630 withsparseread = getattr(r, '_withsparseread', False)
627
631
628 def revinfo(rev):
632 def revinfo(rev):
629 e = index[rev]
633 e = index[rev]
630 compsize = e[1]
634 compsize = e[1]
631 uncompsize = e[2]
635 uncompsize = e[2]
632 chainsize = 0
636 chainsize = 0
633
637
634 if generaldelta:
638 if generaldelta:
635 if e[3] == e[5]:
639 if e[3] == e[5]:
636 deltatype = 'p1'
640 deltatype = 'p1'
637 elif e[3] == e[6]:
641 elif e[3] == e[6]:
638 deltatype = 'p2'
642 deltatype = 'p2'
639 elif e[3] == rev - 1:
643 elif e[3] == rev - 1:
640 deltatype = 'prev'
644 deltatype = 'prev'
641 elif e[3] == rev:
645 elif e[3] == rev:
642 deltatype = 'base'
646 deltatype = 'base'
643 else:
647 else:
644 deltatype = 'other'
648 deltatype = 'other'
645 else:
649 else:
646 if e[3] == rev:
650 if e[3] == rev:
647 deltatype = 'base'
651 deltatype = 'base'
648 else:
652 else:
649 deltatype = 'prev'
653 deltatype = 'prev'
650
654
651 chain = r._deltachain(rev)[0]
655 chain = r._deltachain(rev)[0]
652 for iterrev in chain:
656 for iterrev in chain:
653 e = index[iterrev]
657 e = index[iterrev]
654 chainsize += e[1]
658 chainsize += e[1]
655
659
656 return compsize, uncompsize, deltatype, chain, chainsize
660 return compsize, uncompsize, deltatype, chain, chainsize
657
661
658 fm = ui.formatter('debugdeltachain', opts)
662 fm = ui.formatter('debugdeltachain', opts)
659
663
660 fm.plain(' rev chain# chainlen prev delta '
664 fm.plain(' rev chain# chainlen prev delta '
661 'size rawsize chainsize ratio lindist extradist '
665 'size rawsize chainsize ratio lindist extradist '
662 'extraratio')
666 'extraratio')
663 if withsparseread:
667 if withsparseread:
664 fm.plain(' readsize largestblk rddensity srchunks')
668 fm.plain(' readsize largestblk rddensity srchunks')
665 fm.plain('\n')
669 fm.plain('\n')
666
670
667 chainbases = {}
671 chainbases = {}
668 for rev in r:
672 for rev in r:
669 comp, uncomp, deltatype, chain, chainsize = revinfo(rev)
673 comp, uncomp, deltatype, chain, chainsize = revinfo(rev)
670 chainbase = chain[0]
674 chainbase = chain[0]
671 chainid = chainbases.setdefault(chainbase, len(chainbases) + 1)
675 chainid = chainbases.setdefault(chainbase, len(chainbases) + 1)
672 basestart = start(chainbase)
676 basestart = start(chainbase)
673 revstart = start(rev)
677 revstart = start(rev)
674 lineardist = revstart + comp - basestart
678 lineardist = revstart + comp - basestart
675 extradist = lineardist - chainsize
679 extradist = lineardist - chainsize
676 try:
680 try:
677 prevrev = chain[-2]
681 prevrev = chain[-2]
678 except IndexError:
682 except IndexError:
679 prevrev = -1
683 prevrev = -1
680
684
681 if uncomp != 0:
685 if uncomp != 0:
682 chainratio = float(chainsize) / float(uncomp)
686 chainratio = float(chainsize) / float(uncomp)
683 else:
687 else:
684 chainratio = chainsize
688 chainratio = chainsize
685
689
686 if chainsize != 0:
690 if chainsize != 0:
687 extraratio = float(extradist) / float(chainsize)
691 extraratio = float(extradist) / float(chainsize)
688 else:
692 else:
689 extraratio = extradist
693 extraratio = extradist
690
694
691 fm.startitem()
695 fm.startitem()
692 fm.write('rev chainid chainlen prevrev deltatype compsize '
696 fm.write('rev chainid chainlen prevrev deltatype compsize '
693 'uncompsize chainsize chainratio lindist extradist '
697 'uncompsize chainsize chainratio lindist extradist '
694 'extraratio',
698 'extraratio',
695 '%7d %7d %8d %8d %7s %10d %10d %10d %9.5f %9d %9d %10.5f',
699 '%7d %7d %8d %8d %7s %10d %10d %10d %9.5f %9d %9d %10.5f',
696 rev, chainid, len(chain), prevrev, deltatype, comp,
700 rev, chainid, len(chain), prevrev, deltatype, comp,
697 uncomp, chainsize, chainratio, lineardist, extradist,
701 uncomp, chainsize, chainratio, lineardist, extradist,
698 extraratio,
702 extraratio,
699 rev=rev, chainid=chainid, chainlen=len(chain),
703 rev=rev, chainid=chainid, chainlen=len(chain),
700 prevrev=prevrev, deltatype=deltatype, compsize=comp,
704 prevrev=prevrev, deltatype=deltatype, compsize=comp,
701 uncompsize=uncomp, chainsize=chainsize,
705 uncompsize=uncomp, chainsize=chainsize,
702 chainratio=chainratio, lindist=lineardist,
706 chainratio=chainratio, lindist=lineardist,
703 extradist=extradist, extraratio=extraratio)
707 extradist=extradist, extraratio=extraratio)
704 if withsparseread:
708 if withsparseread:
705 readsize = 0
709 readsize = 0
706 largestblock = 0
710 largestblock = 0
707 srchunks = 0
711 srchunks = 0
708
712
709 for revschunk in revlog._slicechunk(r, chain):
713 for revschunk in deltautil.slicechunk(r, chain):
710 srchunks += 1
714 srchunks += 1
711 blkend = start(revschunk[-1]) + length(revschunk[-1])
715 blkend = start(revschunk[-1]) + length(revschunk[-1])
712 blksize = blkend - start(revschunk[0])
716 blksize = blkend - start(revschunk[0])
713
717
714 readsize += blksize
718 readsize += blksize
715 if largestblock < blksize:
719 if largestblock < blksize:
716 largestblock = blksize
720 largestblock = blksize
717
721
718 if readsize:
722 if readsize:
719 readdensity = float(chainsize) / float(readsize)
723 readdensity = float(chainsize) / float(readsize)
720 else:
724 else:
721 readdensity = 1
725 readdensity = 1
722
726
723 fm.write('readsize largestblock readdensity srchunks',
727 fm.write('readsize largestblock readdensity srchunks',
724 ' %10d %10d %9.5f %8d',
728 ' %10d %10d %9.5f %8d',
725 readsize, largestblock, readdensity, srchunks,
729 readsize, largestblock, readdensity, srchunks,
726 readsize=readsize, largestblock=largestblock,
730 readsize=readsize, largestblock=largestblock,
727 readdensity=readdensity, srchunks=srchunks)
731 readdensity=readdensity, srchunks=srchunks)
728
732
729 fm.plain('\n')
733 fm.plain('\n')
730
734
731 fm.end()
735 fm.end()
732
736
733 @command('debugdirstate|debugstate',
737 @command('debugdirstate|debugstate',
734 [('', 'nodates', None, _('do not display the saved mtime')),
738 [('', 'nodates', None, _('do not display the saved mtime')),
735 ('', 'datesort', None, _('sort by saved mtime'))],
739 ('', 'datesort', None, _('sort by saved mtime'))],
736 _('[OPTION]...'))
740 _('[OPTION]...'))
737 def debugstate(ui, repo, **opts):
741 def debugstate(ui, repo, **opts):
738 """show the contents of the current dirstate"""
742 """show the contents of the current dirstate"""
739
743
740 nodates = opts.get(r'nodates')
744 nodates = opts.get(r'nodates')
741 datesort = opts.get(r'datesort')
745 datesort = opts.get(r'datesort')
742
746
743 timestr = ""
747 timestr = ""
744 if datesort:
748 if datesort:
745 keyfunc = lambda x: (x[1][3], x[0]) # sort by mtime, then by filename
749 keyfunc = lambda x: (x[1][3], x[0]) # sort by mtime, then by filename
746 else:
750 else:
747 keyfunc = None # sort by filename
751 keyfunc = None # sort by filename
748 for file_, ent in sorted(repo.dirstate._map.iteritems(), key=keyfunc):
752 for file_, ent in sorted(repo.dirstate._map.iteritems(), key=keyfunc):
749 if ent[3] == -1:
753 if ent[3] == -1:
750 timestr = 'unset '
754 timestr = 'unset '
751 elif nodates:
755 elif nodates:
752 timestr = 'set '
756 timestr = 'set '
753 else:
757 else:
754 timestr = time.strftime(r"%Y-%m-%d %H:%M:%S ",
758 timestr = time.strftime(r"%Y-%m-%d %H:%M:%S ",
755 time.localtime(ent[3]))
759 time.localtime(ent[3]))
756 timestr = encoding.strtolocal(timestr)
760 timestr = encoding.strtolocal(timestr)
757 if ent[1] & 0o20000:
761 if ent[1] & 0o20000:
758 mode = 'lnk'
762 mode = 'lnk'
759 else:
763 else:
760 mode = '%3o' % (ent[1] & 0o777 & ~util.umask)
764 mode = '%3o' % (ent[1] & 0o777 & ~util.umask)
761 ui.write("%c %s %10d %s%s\n" % (ent[0], mode, ent[2], timestr, file_))
765 ui.write("%c %s %10d %s%s\n" % (ent[0], mode, ent[2], timestr, file_))
762 for f in repo.dirstate.copies():
766 for f in repo.dirstate.copies():
763 ui.write(_("copy: %s -> %s\n") % (repo.dirstate.copied(f), f))
767 ui.write(_("copy: %s -> %s\n") % (repo.dirstate.copied(f), f))
764
768
765 @command('debugdiscovery',
769 @command('debugdiscovery',
766 [('', 'old', None, _('use old-style discovery')),
770 [('', 'old', None, _('use old-style discovery')),
767 ('', 'nonheads', None,
771 ('', 'nonheads', None,
768 _('use old-style discovery with non-heads included')),
772 _('use old-style discovery with non-heads included')),
769 ('', 'rev', [], 'restrict discovery to this set of revs'),
773 ('', 'rev', [], 'restrict discovery to this set of revs'),
770 ] + cmdutil.remoteopts,
774 ] + cmdutil.remoteopts,
771 _('[--rev REV] [OTHER]'))
775 _('[--rev REV] [OTHER]'))
772 def debugdiscovery(ui, repo, remoteurl="default", **opts):
776 def debugdiscovery(ui, repo, remoteurl="default", **opts):
773 """runs the changeset discovery protocol in isolation"""
777 """runs the changeset discovery protocol in isolation"""
774 opts = pycompat.byteskwargs(opts)
778 opts = pycompat.byteskwargs(opts)
775 remoteurl, branches = hg.parseurl(ui.expandpath(remoteurl))
779 remoteurl, branches = hg.parseurl(ui.expandpath(remoteurl))
776 remote = hg.peer(repo, opts, remoteurl)
780 remote = hg.peer(repo, opts, remoteurl)
777 ui.status(_('comparing with %s\n') % util.hidepassword(remoteurl))
781 ui.status(_('comparing with %s\n') % util.hidepassword(remoteurl))
778
782
779 # make sure tests are repeatable
783 # make sure tests are repeatable
780 random.seed(12323)
784 random.seed(12323)
781
785
782 def doit(pushedrevs, remoteheads, remote=remote):
786 def doit(pushedrevs, remoteheads, remote=remote):
783 if opts.get('old'):
787 if opts.get('old'):
784 if not util.safehasattr(remote, 'branches'):
788 if not util.safehasattr(remote, 'branches'):
785 # enable in-client legacy support
789 # enable in-client legacy support
786 remote = localrepo.locallegacypeer(remote.local())
790 remote = localrepo.locallegacypeer(remote.local())
787 common, _in, hds = treediscovery.findcommonincoming(repo, remote,
791 common, _in, hds = treediscovery.findcommonincoming(repo, remote,
788 force=True)
792 force=True)
789 common = set(common)
793 common = set(common)
790 if not opts.get('nonheads'):
794 if not opts.get('nonheads'):
791 ui.write(("unpruned common: %s\n") %
795 ui.write(("unpruned common: %s\n") %
792 " ".join(sorted(short(n) for n in common)))
796 " ".join(sorted(short(n) for n in common)))
793
797
794 clnode = repo.changelog.node
798 clnode = repo.changelog.node
795 common = repo.revs('heads(::%ln)', common)
799 common = repo.revs('heads(::%ln)', common)
796 common = {clnode(r) for r in common}
800 common = {clnode(r) for r in common}
797 else:
801 else:
798 nodes = None
802 nodes = None
799 if pushedrevs:
803 if pushedrevs:
800 revs = scmutil.revrange(repo, pushedrevs)
804 revs = scmutil.revrange(repo, pushedrevs)
801 nodes = [repo[r].node() for r in revs]
805 nodes = [repo[r].node() for r in revs]
802 common, any, hds = setdiscovery.findcommonheads(ui, repo, remote,
806 common, any, hds = setdiscovery.findcommonheads(ui, repo, remote,
803 ancestorsof=nodes)
807 ancestorsof=nodes)
804 common = set(common)
808 common = set(common)
805 rheads = set(hds)
809 rheads = set(hds)
806 lheads = set(repo.heads())
810 lheads = set(repo.heads())
807 ui.write(("common heads: %s\n") %
811 ui.write(("common heads: %s\n") %
808 " ".join(sorted(short(n) for n in common)))
812 " ".join(sorted(short(n) for n in common)))
809 if lheads <= common:
813 if lheads <= common:
810 ui.write(("local is subset\n"))
814 ui.write(("local is subset\n"))
811 elif rheads <= common:
815 elif rheads <= common:
812 ui.write(("remote is subset\n"))
816 ui.write(("remote is subset\n"))
813
817
814 remoterevs, _checkout = hg.addbranchrevs(repo, remote, branches, revs=None)
818 remoterevs, _checkout = hg.addbranchrevs(repo, remote, branches, revs=None)
815 localrevs = opts['rev']
819 localrevs = opts['rev']
816 doit(localrevs, remoterevs)
820 doit(localrevs, remoterevs)
817
821
818 _chunksize = 4 << 10
822 _chunksize = 4 << 10
819
823
820 @command('debugdownload',
824 @command('debugdownload',
821 [
825 [
822 ('o', 'output', '', _('path')),
826 ('o', 'output', '', _('path')),
823 ],
827 ],
824 optionalrepo=True)
828 optionalrepo=True)
825 def debugdownload(ui, repo, url, output=None, **opts):
829 def debugdownload(ui, repo, url, output=None, **opts):
826 """download a resource using Mercurial logic and config
830 """download a resource using Mercurial logic and config
827 """
831 """
828 fh = urlmod.open(ui, url, output)
832 fh = urlmod.open(ui, url, output)
829
833
830 dest = ui
834 dest = ui
831 if output:
835 if output:
832 dest = open(output, "wb", _chunksize)
836 dest = open(output, "wb", _chunksize)
833 try:
837 try:
834 data = fh.read(_chunksize)
838 data = fh.read(_chunksize)
835 while data:
839 while data:
836 dest.write(data)
840 dest.write(data)
837 data = fh.read(_chunksize)
841 data = fh.read(_chunksize)
838 finally:
842 finally:
839 if output:
843 if output:
840 dest.close()
844 dest.close()
841
845
842 @command('debugextensions', cmdutil.formatteropts, [], optionalrepo=True)
846 @command('debugextensions', cmdutil.formatteropts, [], optionalrepo=True)
843 def debugextensions(ui, repo, **opts):
847 def debugextensions(ui, repo, **opts):
844 '''show information about active extensions'''
848 '''show information about active extensions'''
845 opts = pycompat.byteskwargs(opts)
849 opts = pycompat.byteskwargs(opts)
846 exts = extensions.extensions(ui)
850 exts = extensions.extensions(ui)
847 hgver = util.version()
851 hgver = util.version()
848 fm = ui.formatter('debugextensions', opts)
852 fm = ui.formatter('debugextensions', opts)
849 for extname, extmod in sorted(exts, key=operator.itemgetter(0)):
853 for extname, extmod in sorted(exts, key=operator.itemgetter(0)):
850 isinternal = extensions.ismoduleinternal(extmod)
854 isinternal = extensions.ismoduleinternal(extmod)
851 extsource = pycompat.fsencode(extmod.__file__)
855 extsource = pycompat.fsencode(extmod.__file__)
852 if isinternal:
856 if isinternal:
853 exttestedwith = [] # never expose magic string to users
857 exttestedwith = [] # never expose magic string to users
854 else:
858 else:
855 exttestedwith = getattr(extmod, 'testedwith', '').split()
859 exttestedwith = getattr(extmod, 'testedwith', '').split()
856 extbuglink = getattr(extmod, 'buglink', None)
860 extbuglink = getattr(extmod, 'buglink', None)
857
861
858 fm.startitem()
862 fm.startitem()
859
863
860 if ui.quiet or ui.verbose:
864 if ui.quiet or ui.verbose:
861 fm.write('name', '%s\n', extname)
865 fm.write('name', '%s\n', extname)
862 else:
866 else:
863 fm.write('name', '%s', extname)
867 fm.write('name', '%s', extname)
864 if isinternal or hgver in exttestedwith:
868 if isinternal or hgver in exttestedwith:
865 fm.plain('\n')
869 fm.plain('\n')
866 elif not exttestedwith:
870 elif not exttestedwith:
867 fm.plain(_(' (untested!)\n'))
871 fm.plain(_(' (untested!)\n'))
868 else:
872 else:
869 lasttestedversion = exttestedwith[-1]
873 lasttestedversion = exttestedwith[-1]
870 fm.plain(' (%s!)\n' % lasttestedversion)
874 fm.plain(' (%s!)\n' % lasttestedversion)
871
875
872 fm.condwrite(ui.verbose and extsource, 'source',
876 fm.condwrite(ui.verbose and extsource, 'source',
873 _(' location: %s\n'), extsource or "")
877 _(' location: %s\n'), extsource or "")
874
878
875 if ui.verbose:
879 if ui.verbose:
876 fm.plain(_(' bundled: %s\n') % ['no', 'yes'][isinternal])
880 fm.plain(_(' bundled: %s\n') % ['no', 'yes'][isinternal])
877 fm.data(bundled=isinternal)
881 fm.data(bundled=isinternal)
878
882
879 fm.condwrite(ui.verbose and exttestedwith, 'testedwith',
883 fm.condwrite(ui.verbose and exttestedwith, 'testedwith',
880 _(' tested with: %s\n'),
884 _(' tested with: %s\n'),
881 fm.formatlist(exttestedwith, name='ver'))
885 fm.formatlist(exttestedwith, name='ver'))
882
886
883 fm.condwrite(ui.verbose and extbuglink, 'buglink',
887 fm.condwrite(ui.verbose and extbuglink, 'buglink',
884 _(' bug reporting: %s\n'), extbuglink or "")
888 _(' bug reporting: %s\n'), extbuglink or "")
885
889
886 fm.end()
890 fm.end()
887
891
@command('debugfileset',
    [('r', 'rev', '', _('apply the filespec on this revision'), _('REV')),
     ('', 'all-files', False,
      _('test files from all revisions and working directory')),
     ('s', 'show-matcher', None,
      _('print internal representation of matcher')),
     ('p', 'show-stage', [],
      _('print parsed tree at the given stage'), _('NAME'))],
    _('[-r REV] [--all-files] [OPTION]... FILESPEC'))
def debugfileset(ui, repo, expr, **opts):
    '''parse and apply a fileset specification'''
    from . import fileset
    fileset.symbols # force import of fileset so we have predicates to optimize
    opts = pycompat.byteskwargs(opts)
    ctx = scmutil.revsingle(repo, opts.get('rev'), None)

    stages = [
        ('parsed', pycompat.identity),
        ('analyzed', filesetlang.analyze),
        ('optimized', filesetlang.optimize),
    ]
    stagenames = set(n for n, f in stages)

    showalways = set()
    if ui.verbose and not opts['show_stage']:
        # show parsed tree by --verbose (deprecated)
        showalways.add('parsed')
    if opts['show_stage'] == ['all']:
        showalways.update(stagenames)
    else:
        for n in opts['show_stage']:
            if n not in stagenames:
                raise error.Abort(_('invalid stage name: %s') % n)
        showalways.update(opts['show_stage'])

    tree = filesetlang.parse(expr)
    for n, f in stages:
        tree = f(tree)
        if n in showalways:
            if opts['show_stage'] or n != 'parsed':
                ui.write(("* %s:\n") % n)
            ui.write(filesetlang.prettyformat(tree), "\n")

    files = set()
    if opts['all_files']:
        for r in repo:
            c = repo[r]
            files.update(c.files())
            files.update(c.substate)
    if opts['all_files'] or ctx.rev() is None:
        wctx = repo[None]
        files.update(repo.dirstate.walk(scmutil.matchall(repo),
                                        subrepos=list(wctx.substate),
                                        unknown=True, ignored=True))
        files.update(wctx.substate)
    else:
        files.update(ctx.files())
        files.update(ctx.substate)

    m = ctx.matchfileset(expr)
    if opts['show_matcher'] or (opts['show_matcher'] is None and ui.verbose):
        ui.write(('* matcher:\n'), stringutil.prettyrepr(m), '\n')
    for f in sorted(files):
        if not m(f):
            continue
        ui.write("%s\n" % f)

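# Illustrative 'hg debugfileset' invocation (hypothetical fileset):
#   hg debugfileset -p all 'added() and glob:**.py'
# prints the tree after each stage registered above (parsed, analyzed,
# optimized), then the matching file names one per line.
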
@command('debugformat',
         [] + cmdutil.formatteropts)
def debugformat(ui, repo, **opts):
    """display format information about the current repository

    Use --verbose to get extra information about the current config value
    and the Mercurial default."""
    opts = pycompat.byteskwargs(opts)
    maxvariantlength = max(len(fv.name) for fv in upgrade.allformatvariant)
    maxvariantlength = max(len('format-variant'), maxvariantlength)

    def makeformatname(name):
        return '%s:' + (' ' * (maxvariantlength - len(name)))

    fm = ui.formatter('debugformat', opts)
    if fm.isplain():
        def formatvalue(value):
            if util.safehasattr(value, 'startswith'):
                return value
            if value:
                return 'yes'
            else:
                return 'no'
    else:
        formatvalue = pycompat.identity

    fm.plain('format-variant')
    fm.plain(' ' * (maxvariantlength - len('format-variant')))
    fm.plain(' repo')
    if ui.verbose:
        fm.plain(' config default')
    fm.plain('\n')
    for fv in upgrade.allformatvariant:
        fm.startitem()
        repovalue = fv.fromrepo(repo)
        configvalue = fv.fromconfig(repo)

        if repovalue != configvalue:
            namelabel = 'formatvariant.name.mismatchconfig'
            repolabel = 'formatvariant.repo.mismatchconfig'
        elif repovalue != fv.default:
            namelabel = 'formatvariant.name.mismatchdefault'
            repolabel = 'formatvariant.repo.mismatchdefault'
        else:
            namelabel = 'formatvariant.name.uptodate'
            repolabel = 'formatvariant.repo.uptodate'

        fm.write('name', makeformatname(fv.name), fv.name,
                 label=namelabel)
        fm.write('repo', ' %3s', formatvalue(repovalue),
                 label=repolabel)
        if fv.default != configvalue:
            configlabel = 'formatvariant.config.special'
        else:
            configlabel = 'formatvariant.config.default'
        fm.condwrite(ui.verbose, 'config', ' %6s', formatvalue(configvalue),
                     label=configlabel)
        fm.condwrite(ui.verbose, 'default', ' %7s', formatvalue(fv.default),
                     label='formatvariant.default')
        fm.plain('\n')
    fm.end()

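# Illustrative plain 'hg debugformat' output (variant names and values
# depend on the repository; the layout comes from makeformatname above):
#   format-variant repo
#   fncache:        yes
#   dotencode:      yes
# With --verbose, the 'config' and 'default' columns are appended.
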
@command('debugfsinfo', [], _('[PATH]'), norepo=True)
def debugfsinfo(ui, path="."):
    """show information detected about current filesystem"""
    ui.write(('path: %s\n') % path)
    ui.write(('mounted on: %s\n') % (util.getfsmountpoint(path) or '(unknown)'))
    ui.write(('exec: %s\n') % (util.checkexec(path) and 'yes' or 'no'))
    ui.write(('fstype: %s\n') % (util.getfstype(path) or '(unknown)'))
    ui.write(('symlink: %s\n') % (util.checklink(path) and 'yes' or 'no'))
    ui.write(('hardlink: %s\n') % (util.checknlink(path) and 'yes' or 'no'))
    casesensitive = '(unknown)'
    try:
        with pycompat.namedtempfile(prefix='.debugfsinfo', dir=path) as f:
            casesensitive = util.fscasesensitive(f.name) and 'yes' or 'no'
    except OSError:
        pass
    ui.write(('case-sensitive: %s\n') % casesensitive)

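# Illustrative 'hg debugfsinfo' output (values are environment-dependent,
# e.g. on a case-sensitive ext4 mount):
#   exec: yes
#   fstype: ext4
#   symlink: yes
#   case-sensitive: yes
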
@command('debuggetbundle',
    [('H', 'head', [], _('id of head node'), _('ID')),
     ('C', 'common', [], _('id of common node'), _('ID')),
     ('t', 'type', 'bzip2', _('bundle compression type to use'), _('TYPE'))],
    _('REPO FILE [-H|-C ID]...'),
    norepo=True)
def debuggetbundle(ui, repopath, bundlepath, head=None, common=None, **opts):
    """retrieves a bundle from a repo

    Every ID must be a full-length hex node id string. Saves the bundle to the
    given file.
    """
    opts = pycompat.byteskwargs(opts)
    repo = hg.peer(ui, opts, repopath)
    if not repo.capable('getbundle'):
        raise error.Abort("getbundle() not supported by target repository")
    args = {}
    if common:
        args[r'common'] = [bin(s) for s in common]
    if head:
        args[r'heads'] = [bin(s) for s in head]
    # TODO: get desired bundlecaps from command line.
    args[r'bundlecaps'] = None
    bundle = repo.getbundle('debug', **args)

    bundletype = opts.get('type', 'bzip2').lower()
    btypes = {'none': 'HG10UN',
              'bzip2': 'HG10BZ',
              'gzip': 'HG10GZ',
              'bundle2': 'HG20'}
    bundletype = btypes.get(bundletype)
    if bundletype not in bundle2.bundletypes:
        raise error.Abort(_('unknown bundle type specified with --type'))
    bundle2.writebundle(ui, bundle, bundlepath, bundletype)

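# Illustrative 'hg debuggetbundle' invocation (hypothetical URL and head
# id; IDs must be full 40-hex nodes, per the docstring above):
#   hg debuggetbundle https://example.com/repo out.hg \
#       -H 0123456789abcdef0123456789abcdef01234567 -t bundle2
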
@command('debugignore', [], '[FILE]')
def debugignore(ui, repo, *files, **opts):
    """display the combined ignore pattern and information about ignored files

    With no arguments, display the combined ignore pattern.

    Given space-separated file names, show whether each file is ignored and,
    if so, the ignore rule (file and line number) that matched it.
    """
    ignore = repo.dirstate._ignore
    if not files:
        # Show all the patterns
        ui.write("%s\n" % pycompat.byterepr(ignore))
    else:
        m = scmutil.match(repo[None], pats=files)
        for f in m.files():
            nf = util.normpath(f)
            ignored = None
            ignoredata = None
            if nf != '.':
                if ignore(nf):
                    ignored = nf
                    ignoredata = repo.dirstate._ignorefileandline(nf)
                else:
                    for p in util.finddirs(nf):
                        if ignore(p):
                            ignored = p
                            ignoredata = repo.dirstate._ignorefileandline(p)
                            break
            if ignored:
                if ignored == nf:
                    ui.write(_("%s is ignored\n") % m.uipath(f))
                else:
                    ui.write(_("%s is ignored because of "
                               "containing folder %s\n")
                             % (m.uipath(f), ignored))
                ignorefile, lineno, line = ignoredata
                ui.write(_("(ignore rule in %s, line %d: '%s')\n")
                         % (ignorefile, lineno, line))
            else:
                ui.write(_("%s is not ignored\n") % m.uipath(f))

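# Illustrative 'hg debugignore' session (hypothetical .hgignore containing
# the single pattern 'glob:*.pyc'):
#   $ hg debugignore foo.pyc
#   foo.pyc is ignored
#   (ignore rule in .hgignore, line 1: 'glob:*.pyc')
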
@command('debugindex', cmdutil.debugrevlogopts + cmdutil.formatteropts,
         _('-c|-m|FILE'))
def debugindex(ui, repo, file_=None, **opts):
    """dump index data for a storage primitive"""
    opts = pycompat.byteskwargs(opts)
    store = cmdutil.openstorage(repo, 'debugindex', file_, opts)

    if ui.debugflag:
        shortfn = hex
    else:
        shortfn = short

    idlen = 12
    for i in store:
        idlen = len(shortfn(store.node(i)))
        break

    fm = ui.formatter('debugindex', opts)
    fm.plain(b'   rev linkrev %s %s p2\n' % (
        b'nodeid'.ljust(idlen),
        b'p1'.ljust(idlen)))

    for rev in store:
        node = store.node(rev)
        parents = store.parents(node)

        fm.startitem()
        fm.write(b'rev', b'%6d ', rev)
        fm.write(b'linkrev', '%7d ', store.linkrev(rev))
        fm.write(b'node', '%s ', shortfn(node))
        fm.write(b'p1', '%s ', shortfn(parents[0]))
        fm.write(b'p2', '%s', shortfn(parents[1]))
        fm.plain(b'\n')

    fm.end()

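# Illustrative 'hg debugindex -c' output (hashes hypothetical; the probe
# loop above sizes the columns from the first node's hash length):
#      rev linkrev nodeid       p1           p2
#        0       0 1ea73414a91b 000000000000 000000000000
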
@command('debugindexdot', cmdutil.debugrevlogopts,
         _('-c|-m|FILE'), optionalrepo=True)
def debugindexdot(ui, repo, file_=None, **opts):
    """dump an index DAG as a graphviz dot file"""
    opts = pycompat.byteskwargs(opts)
    r = cmdutil.openstorage(repo, 'debugindexdot', file_, opts)
    ui.write(("digraph G {\n"))
    for i in r:
        node = r.node(i)
        pp = r.parents(node)
        ui.write("\t%d -> %d\n" % (r.rev(pp[0]), i))
        if pp[1] != nullid:
            ui.write("\t%d -> %d\n" % (r.rev(pp[1]), i))
    ui.write("}\n")

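# The output of 'hg debugindexdot' is plain graphviz; a typical rendering
# step (assuming graphviz is installed) would be:
#   hg debugindexdot -c | dot -Tsvg > dag.svg
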
@command('debuginstall', [] + cmdutil.formatteropts, '', norepo=True)
def debuginstall(ui, **opts):
    '''test Mercurial installation

    Returns 0 on success.
    '''
    opts = pycompat.byteskwargs(opts)

    def writetemp(contents):
        (fd, name) = pycompat.mkstemp(prefix="hg-debuginstall-")
        f = os.fdopen(fd, r"wb")
        f.write(contents)
        f.close()
        return name

    problems = 0

    fm = ui.formatter('debuginstall', opts)
    fm.startitem()

    # encoding
    fm.write('encoding', _("checking encoding (%s)...\n"), encoding.encoding)
    err = None
    try:
        codecs.lookup(pycompat.sysstr(encoding.encoding))
    except LookupError as inst:
        err = stringutil.forcebytestr(inst)
        problems += 1
    fm.condwrite(err, 'encodingerror', _(" %s\n"
                 " (check that your locale is properly set)\n"), err)

    # Python
    fm.write('pythonexe', _("checking Python executable (%s)\n"),
             pycompat.sysexecutable)
    fm.write('pythonver', _("checking Python version (%s)\n"),
             ("%d.%d.%d" % sys.version_info[:3]))
    fm.write('pythonlib', _("checking Python lib (%s)...\n"),
             os.path.dirname(pycompat.fsencode(os.__file__)))

    security = set(sslutil.supportedprotocols)
    if sslutil.hassni:
        security.add('sni')

    fm.write('pythonsecurity', _("checking Python security support (%s)\n"),
             fm.formatlist(sorted(security), name='protocol',
                           fmt='%s', sep=','))

    # These are warnings, not errors. So don't increment problem count. This
    # may change in the future.
    if 'tls1.2' not in security:
        fm.plain(_(' TLS 1.2 not supported by Python install; '
                   'network connections lack modern security\n'))
    if 'sni' not in security:
        fm.plain(_(' SNI not supported by Python install; may have '
                   'connectivity issues with some servers\n'))

    # TODO print CA cert info

    # hg version
    hgver = util.version()
    fm.write('hgver', _("checking Mercurial version (%s)\n"),
             hgver.split('+')[0])
    fm.write('hgverextra', _("checking Mercurial custom build (%s)\n"),
             '+'.join(hgver.split('+')[1:]))

    # compiled modules
    fm.write('hgmodulepolicy', _("checking module policy (%s)\n"),
             policy.policy)
    fm.write('hgmodules', _("checking installed modules (%s)...\n"),
             os.path.dirname(pycompat.fsencode(__file__)))

    if policy.policy in ('c', 'allow'):
        err = None
        try:
            from .cext import (
                base85,
                bdiff,
                mpatch,
                osutil,
            )
            dir(bdiff), dir(mpatch), dir(base85), dir(osutil) # quiet pyflakes
        except Exception as inst:
            err = stringutil.forcebytestr(inst)
            problems += 1
        fm.condwrite(err, 'extensionserror', " %s\n", err)

    compengines = util.compengines._engines.values()
    fm.write('compengines', _('checking registered compression engines (%s)\n'),
             fm.formatlist(sorted(e.name() for e in compengines),
                           name='compengine', fmt='%s', sep=', '))
    fm.write('compenginesavail', _('checking available compression engines '
                                   '(%s)\n'),
             fm.formatlist(sorted(e.name() for e in compengines
                                  if e.available()),
                           name='compengine', fmt='%s', sep=', '))
    wirecompengines = util.compengines.supportedwireengines(util.SERVERROLE)
    fm.write('compenginesserver', _('checking available compression engines '
                                    'for wire protocol (%s)\n'),
             fm.formatlist([e.name() for e in wirecompengines
                            if e.wireprotosupport()],
                           name='compengine', fmt='%s', sep=', '))
    re2 = 'missing'
    if util._re2:
        re2 = 'available'
    fm.plain(_('checking "re2" regexp engine (%s)\n') % re2)
    fm.data(re2=bool(util._re2))

    # templates
    p = templater.templatepaths()
    fm.write('templatedirs', 'checking templates (%s)...\n', ' '.join(p))
    fm.condwrite(not p, '', _(" no template directories found\n"))
    if p:
        m = templater.templatepath("map-cmdline.default")
        if m:
            # template found, check if it is working
            err = None
            try:
                templater.templater.frommapfile(m)
            except Exception as inst:
                err = stringutil.forcebytestr(inst)
                p = None
            fm.condwrite(err, 'defaulttemplateerror', " %s\n", err)
        else:
            p = None
        fm.condwrite(p, 'defaulttemplate',
                     _("checking default template (%s)\n"), m)
        fm.condwrite(not m, 'defaulttemplatenotfound',
                     _(" template '%s' not found\n"), "default")
    if not p:
        problems += 1
    fm.condwrite(not p, '',
                 _(" (templates seem to have been installed incorrectly)\n"))

    # editor
    editor = ui.geteditor()
    editor = util.expandpath(editor)
    editorbin = procutil.shellsplit(editor)[0]
    fm.write('editor', _("checking commit editor... (%s)\n"), editorbin)
    cmdpath = procutil.findexe(editorbin)
    fm.condwrite(not cmdpath and editor == 'vi', 'vinotfound',
                 _(" No commit editor set and can't find %s in PATH\n"
                   " (specify a commit editor in your configuration"
                   " file)\n"), not cmdpath and editor == 'vi' and editorbin)
    fm.condwrite(not cmdpath and editor != 'vi', 'editornotfound',
                 _(" Can't find editor '%s' in PATH\n"
                   " (specify a commit editor in your configuration"
                   " file)\n"), not cmdpath and editorbin)
    if not cmdpath and editor != 'vi':
        problems += 1

    # check username
    username = None
    err = None
    try:
        username = ui.username()
    except error.Abort as e:
        err = stringutil.forcebytestr(e)
        problems += 1

    fm.condwrite(username, 'username', _("checking username (%s)\n"), username)
    fm.condwrite(err, 'usernameerror', _("checking username...\n %s\n"
                 " (specify a username in your configuration file)\n"), err)

    fm.condwrite(not problems, '',
                 _("no problems detected\n"))
    if not problems:
        fm.data(problems=problems)
    fm.condwrite(problems, 'problems',
                 _("%d problems detected,"
                   " please check your install!\n"), problems)
    fm.end()

    return problems

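# Illustrative tail of a healthy 'hg debuginstall' run (messages emitted
# above; the return value is the number of problems found, so 0 here):
#   checking username (Alice <alice@example.com>)
#   no problems detected
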
@command('debugknown', [], _('REPO ID...'), norepo=True)
def debugknown(ui, repopath, *ids, **opts):
    """test whether node ids are known to a repo

    Every ID must be a full-length hex node id string. Returns a list of 0s
    and 1s indicating unknown/known.
    """
    opts = pycompat.byteskwargs(opts)
    repo = hg.peer(ui, opts, repopath)
    if not repo.capable('known'):
        raise error.Abort("known() not supported by target repository")
    flags = repo.known([bin(s) for s in ids])
    ui.write("%s\n" % ("".join([f and "1" or "0" for f in flags])))

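# Illustrative 'hg debugknown' result (hypothetical): querying two node
# ids of which only the first exists in the target repo prints '10'.
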
@command('debuglabelcomplete', [], _('LABEL...'))
def debuglabelcomplete(ui, repo, *args):
    '''backwards compatibility with old bash completion scripts (DEPRECATED)'''
    debugnamecomplete(ui, repo, *args)

@command('debuglocks',
         [('L', 'force-lock', None, _('free the store lock (DANGEROUS)')),
          ('W', 'force-wlock', None,
           _('free the working state lock (DANGEROUS)')),
          ('s', 'set-lock', None, _('set the store lock until stopped')),
          ('S', 'set-wlock', None,
           _('set the working state lock until stopped'))],
         _('[OPTION]...'))
def debuglocks(ui, repo, **opts):
    """show or modify state of locks

    By default, this command will show which locks are held. This
    includes the user and process holding the lock, the amount of time
    the lock has been held, and the machine name where the process is
    running if it's not local.

    Locks protect the integrity of Mercurial's data, so should be
    treated with care. System crashes or other interruptions may cause
    locks to not be properly released, though Mercurial will usually
    detect and remove such stale locks automatically.

    However, detecting stale locks may not always be possible (for
    instance, on a shared filesystem). Removing locks may also be
    blocked by filesystem permissions.

    Setting a lock will prevent other commands from changing the data.
    The command will wait until an interruption (SIGINT, SIGTERM, ...) occurs.
    The set locks are removed when the command exits.

    Returns 0 if no locks are held.

    """

    if opts.get(r'force_lock'):
        repo.svfs.unlink('lock')
    if opts.get(r'force_wlock'):
        repo.vfs.unlink('wlock')
    if opts.get(r'force_lock') or opts.get(r'force_wlock'):
        return 0

    locks = []
    try:
        if opts.get(r'set_wlock'):
            try:
                locks.append(repo.wlock(False))
            except error.LockHeld:
                raise error.Abort(_('wlock is already held'))
        if opts.get(r'set_lock'):
            try:
                locks.append(repo.lock(False))
            except error.LockHeld:
                raise error.Abort(_('lock is already held'))
        if len(locks):
            ui.promptchoice(_("ready to release the lock (y)? $$ &Yes"))
            return 0
    finally:
        release(*locks)

    now = time.time()
    held = 0

    def report(vfs, name, method):
        # this causes stale locks to get reaped for more accurate reporting
        try:
            l = method(False)
        except error.LockHeld:
            l = None

        if l:
            l.release()
        else:
            try:
                st = vfs.lstat(name)
                age = now - st[stat.ST_MTIME]
                user = util.username(st.st_uid)
                locker = vfs.readlock(name)
                if ":" in locker:
                    host, pid = locker.split(':')
                    if host == socket.gethostname():
                        locker = 'user %s, process %s' % (user, pid)
                    else:
                        locker = 'user %s, process %s, host %s' \
                                 % (user, pid, host)
                ui.write(("%-6s %s (%ds)\n") % (name + ":", locker, age))
                return 1
            except OSError as e:
                if e.errno != errno.ENOENT:
                    raise

        ui.write(("%-6s free\n") % (name + ":"))
        return 0

    held += report(repo.svfs, "lock", repo.lock)
    held += report(repo.vfs, "wlock", repo.wlock)

    return held

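# Illustrative 'hg debuglocks' output (hypothetical PID and age) when the
# store lock is held by a local process and the working-directory lock is
# free, in the format produced by report() above:
#   lock:  user alice, process 12345 (10s)
#   wlock: free
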
@command('debugmanifestfulltextcache', [
        ('', 'clear', False, _('clear the cache')),
        ('a', 'add', '', _('add the given manifest node to the cache'),
         _('NODE'))
    ], '')
def debugmanifestfulltextcache(ui, repo, add=None, **opts):
    """show, clear or amend the contents of the manifest fulltext cache"""
    with repo.lock():
        r = repo.manifestlog.getstorage(b'')
        try:
            cache = r._fulltextcache
        except AttributeError:
            ui.warn(_(
                "Current revlog implementation doesn't appear to have a "
                'manifest fulltext cache\n'))
            return

        if opts.get(r'clear'):
            cache.clear()

        if add:
            try:
                manifest = repo.manifestlog[r.lookup(add)]
            except error.LookupError as e:
                raise error.Abort(e, hint="Check your manifest node id")
            manifest.read()  # stores revision in cache too

        if not len(cache):
            ui.write(_('Cache empty'))
        else:
            ui.write(
                _('Cache contains %d manifest entries, in order of most to '
                  'least recent:\n') % (len(cache),))
            totalsize = 0
            for nodeid in cache:
                # Use cache.get to not update the LRU order
                data = cache.get(nodeid)
                size = len(data)
                totalsize += size + 24 # 20 bytes nodeid, 4 bytes size
                ui.write(_('id: %s, size %s\n') % (
                    hex(nodeid), util.bytecount(size)))
            ondisk = cache._opener.stat('manifestfulltextcache').st_size
            ui.write(
                _('Total cache data size %s, on-disk %s\n') % (
                    util.bytecount(totalsize), util.bytecount(ondisk))
            )

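# Illustrative output (hypothetical single-entry cache; the 24 bytes of
# per-entry overhead are counted in the loop above):
#   Cache contains 1 manifest entries, in order of most to least recent:
#   id: <40-hex nodeid>, size 100 bytes
#   Total cache data size 124 bytes, on-disk 124 bytes
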
@command('debugmergestate', [], '')
def debugmergestate(ui, repo, *args):
    """print merge state

    Use --verbose to print out information about whether v1 or v2 merge state
    was chosen."""
    def _hashornull(h):
        if h == nullhex:
            return 'null'
        else:
            return h

    def printrecords(version):
        ui.write(('* version %d records\n') % version)
        if version == 1:
            records = v1records
        else:
            records = v2records

        for rtype, record in records:
            # pretty print some record types
            if rtype == 'L':
                ui.write(('local: %s\n') % record)
            elif rtype == 'O':
                ui.write(('other: %s\n') % record)
            elif rtype == 'm':
                driver, mdstate = record.split('\0', 1)
                ui.write(('merge driver: %s (state "%s")\n')
                         % (driver, mdstate))
            elif rtype in 'FDC':
                r = record.split('\0')
                f, state, hash, lfile, afile, anode, ofile = r[0:7]
                if version == 1:
                    onode = 'not stored in v1 format'
                    flags = r[7]
                else:
                    onode, flags = r[7:9]
                ui.write(('file: %s (record type "%s", state "%s", hash %s)\n')
                         % (f, rtype, state, _hashornull(hash)))
                ui.write((' local path: %s (flags "%s")\n') % (lfile, flags))
                ui.write((' ancestor path: %s (node %s)\n')
                         % (afile, _hashornull(anode)))
                ui.write((' other path: %s (node %s)\n')
                         % (ofile, _hashornull(onode)))
            elif rtype == 'f':
                filename, rawextras = record.split('\0', 1)
                extras = rawextras.split('\0')
                i = 0
                extrastrings = []
                while i < len(extras):
                    extrastrings.append('%s = %s' % (extras[i], extras[i + 1]))
                    i += 2

                ui.write(('file extras: %s (%s)\n')
                         % (filename, ', '.join(extrastrings)))
            elif rtype == 'l':
                labels = record.split('\0', 2)
                labels = [l for l in labels if len(l) > 0]
                ui.write(('labels:\n'))
                ui.write((' local: %s\n' % labels[0]))
                ui.write((' other: %s\n' % labels[1]))
                if len(labels) > 2:
                    ui.write((' base: %s\n' % labels[2]))
            else:
                ui.write(('unrecognized entry: %s\t%s\n')
                         % (rtype, record.replace('\0', '\t')))

    # Avoid mergestate.read() since it may raise an exception for unsupported
    # merge state records. We shouldn't be doing this, but this is OK since this
    # command is pretty low-level.
    ms = mergemod.mergestate(repo)

    # sort so that reasonable information is on top
    v1records = ms._readrecordsv1()
    v2records = ms._readrecordsv2()
    order = 'LOml'
    def key(r):
        idx = order.find(r[0])
        if idx == -1:
            return (1, r[1])
        else:
            return (0, idx)
    v1records.sort(key=key)
    v2records.sort(key=key)

    if not v1records and not v2records:
        ui.write(('no merge state found\n'))
    elif not v2records:
        ui.note(('no version 2 merge state\n'))
        printrecords(1)
    elif ms._v1v2match(v1records, v2records):
        ui.note(('v1 and v2 states match: using v2\n'))
        printrecords(2)
    else:
        ui.note(('v1 and v2 states mismatch: using v1\n'))
        printrecords(1)
        if ui.verbose:
            printrecords(2)

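# Record types decoded by printrecords above, for reference: 'L'/'O' are
# the local/other changesets, 'm' the merge driver state, 'F'/'D'/'C'
# per-file merge records, 'f' per-file extras, and 'l' the conflict
# marker labels.
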
@command('debugnamecomplete', [], _('NAME...'))
def debugnamecomplete(ui, repo, *args):
    '''complete "names" - tags, open branch names, bookmark names'''

    names = set()
    # since we previously only listed open branches, we will handle that
    # specially (after this for loop)
    for name, ns in repo.names.iteritems():
        if name != 'branches':
            names.update(ns.listnames(repo))
    names.update(tag for (tag, heads, tip, closed)
                 in repo.branchmap().iterbranches() if not closed)
    completions = set()
    if not args:
        args = ['']
    for a in args:
        completions.update(n for n in names if n.startswith(a))
    ui.write('\n'.join(sorted(completions)))
    ui.write('\n')

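# Illustrative use (hypothetical names): 'hg debugnamecomplete re' prints
# every tag, bookmark and open branch name starting with "re", one per
# line, sorted.
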
@command('debugobsolete',
         [('', 'flags', 0, _('markers flag')),
          ('', 'record-parents', False,
           _('record parent information for the precursor')),
          ('r', 'rev', [], _('display markers relevant to REV')),
          ('', 'exclusive', False, _('restrict display to markers only '
                                     'relevant to REV')),
          ('', 'index', False, _('display index of the marker')),
          ('', 'delete', [], _('delete markers specified by indices')),
         ] + cmdutil.commitopts2 + cmdutil.formatteropts,
         _('[OBSOLETED [REPLACEMENT ...]]'))
def debugobsolete(ui, repo, precursor=None, *successors, **opts):
    """create arbitrary obsolete marker

    With no arguments, displays the list of obsolescence markers."""

    opts = pycompat.byteskwargs(opts)

    def parsenodeid(s):
        try:
            # We do not use revsingle/revrange functions here to accept
            # arbitrary node identifiers, possibly not present in the
            # local repository.
            n = bin(s)
            if len(n) != len(nullid):
                raise TypeError()
            return n
        except TypeError:
            raise error.Abort('changeset references must be full hexadecimal '
                              'node identifiers')

    if opts.get('delete'):
        indices = []
        for v in opts.get('delete'):
            try:
                indices.append(int(v))
            except ValueError:
                raise error.Abort(_('invalid index value: %r') % v,
                                  hint=_('use integers for indices'))

        if repo.currenttransaction():
            raise error.Abort(_('cannot delete obsmarkers in the middle '
                                'of a transaction.'))

        with repo.lock():
            n = repair.deleteobsmarkers(repo.obsstore, indices)
            ui.write(_('deleted %i obsolescence markers\n') % n)

        return

    if precursor is not None:
        if opts['rev']:
            raise error.Abort('cannot select revision when creating marker')
        metadata = {}
        metadata['user'] = encoding.fromlocal(opts['user'] or ui.username())
        succs = tuple(parsenodeid(succ) for succ in successors)
        l = repo.lock()
        try:
            tr = repo.transaction('debugobsolete')
            try:
                date = opts.get('date')
                if date:
                    date = dateutil.parsedate(date)
                else:
                    date = None
                prec = parsenodeid(precursor)
                parents = None
                if opts['record_parents']:
                    if prec not in repo.unfiltered():
                        raise error.Abort('cannot use --record-parents on '
                                          'unknown changesets')
                    parents = repo.unfiltered()[prec].parents()
                    parents = tuple(p.node() for p in parents)
                repo.obsstore.create(tr, prec, succs, opts['flags'],
                                     parents=parents, date=date,
                                     metadata=metadata, ui=ui)
                tr.close()
            except ValueError as exc:
                raise error.Abort(_('bad obsmarker input: %s') %
                                  pycompat.bytestr(exc))
            finally:
                tr.release()
        finally:
            l.release()
    else:
        if opts['rev']:
            revs = scmutil.revrange(repo, opts['rev'])
            nodes = [repo[r].node() for r in revs]
            markers = list(obsutil.getmarkers(repo, nodes=nodes,
                                              exclusive=opts['exclusive']))
            markers.sort(key=lambda x: x._data)
        else:
            markers = obsutil.getmarkers(repo)

        markerstoiter = markers
        isrelevant = lambda m: True
        if opts.get('rev') and opts.get('index'):
            markerstoiter = obsutil.getmarkers(repo)
            markerset = set(markers)
            isrelevant = lambda m: m in markerset

        fm = ui.formatter('debugobsolete', opts)
        for i, m in enumerate(markerstoiter):
            if not isrelevant(m):
                # marker can be irrelevant when we're iterating over a set
                # of markers (markerstoiter) which is bigger than the set
                # of markers we want to display (markers)
                # this can happen if both --index and --rev options are
                # provided and thus we need to iterate over all of the markers
                # to get the correct indices, but only display the ones that
                # are relevant to --rev value
                continue
            fm.startitem()
            ind = i if opts.get('index') else None
            cmdutil.showmarker(fm, m, index=ind)
        fm.end()

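# Illustrative 'hg debugobsolete' workflow (node ids must be full 40-hex
# strings, as enforced by parsenodeid above; placeholders hypothetical):
#   hg debugobsolete <prec-node> <succ-node>   # record a marker
#   hg debugobsolete --index                   # list markers with indices
#   hg debugobsolete --delete 0                # remove marker 0
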
1735 @command('debugpathcomplete',
1739 @command('debugpathcomplete',
1736 [('f', 'full', None, _('complete an entire path')),
1740 [('f', 'full', None, _('complete an entire path')),
1737 ('n', 'normal', None, _('show only normal files')),
1741 ('n', 'normal', None, _('show only normal files')),
1738 ('a', 'added', None, _('show only added files')),
1742 ('a', 'added', None, _('show only added files')),
1739 ('r', 'removed', None, _('show only removed files'))],
1743 ('r', 'removed', None, _('show only removed files'))],
1740 _('FILESPEC...'))
1744 _('FILESPEC...'))
1741 def debugpathcomplete(ui, repo, *specs, **opts):
1745 def debugpathcomplete(ui, repo, *specs, **opts):
1742 '''complete part or all of a tracked path
1746 '''complete part or all of a tracked path
1743
1747
1744 This command supports shells that offer path name completion. It
1748 This command supports shells that offer path name completion. It
1745 currently completes only files already known to the dirstate.
1749 currently completes only files already known to the dirstate.
1746
1750
1747 Completion extends only to the next path segment unless
1751 Completion extends only to the next path segment unless
1748 --full is specified, in which case entire paths are used.'''
1752 --full is specified, in which case entire paths are used.'''
1749
1753
1750 def complete(path, acceptable):
1754 def complete(path, acceptable):
1751 dirstate = repo.dirstate
1755 dirstate = repo.dirstate
1752 spec = os.path.normpath(os.path.join(pycompat.getcwd(), path))
1756 spec = os.path.normpath(os.path.join(pycompat.getcwd(), path))
1753 rootdir = repo.root + pycompat.ossep
1757 rootdir = repo.root + pycompat.ossep
1754 if spec != repo.root and not spec.startswith(rootdir):
1758 if spec != repo.root and not spec.startswith(rootdir):
1755 return [], []
1759 return [], []
1756 if os.path.isdir(spec):
1760 if os.path.isdir(spec):
1757 spec += '/'
1761 spec += '/'
1758 spec = spec[len(rootdir):]
1762 spec = spec[len(rootdir):]
1759 fixpaths = pycompat.ossep != '/'
1763 fixpaths = pycompat.ossep != '/'
1760 if fixpaths:
1764 if fixpaths:
1761 spec = spec.replace(pycompat.ossep, '/')
1765 spec = spec.replace(pycompat.ossep, '/')
1762 speclen = len(spec)
1766 speclen = len(spec)
1763 fullpaths = opts[r'full']
1767 fullpaths = opts[r'full']
1764 files, dirs = set(), set()
1768 files, dirs = set(), set()
1765 adddir, addfile = dirs.add, files.add
1769 adddir, addfile = dirs.add, files.add
1766 for f, st in dirstate.iteritems():
1770 for f, st in dirstate.iteritems():
1767 if f.startswith(spec) and st[0] in acceptable:
1771 if f.startswith(spec) and st[0] in acceptable:
1768 if fixpaths:
1772 if fixpaths:
1769 f = f.replace('/', pycompat.ossep)
1773 f = f.replace('/', pycompat.ossep)
1770 if fullpaths:
1774 if fullpaths:
1771 addfile(f)
1775 addfile(f)
1772 continue
1776 continue
1773 s = f.find(pycompat.ossep, speclen)
1777 s = f.find(pycompat.ossep, speclen)
1774 if s >= 0:
1778 if s >= 0:
1775 adddir(f[:s])
1779 adddir(f[:s])
1776 else:
1780 else:
1777 addfile(f)
1781 addfile(f)
1778 return files, dirs
1782 return files, dirs
1779
1783
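    # Dirstate status codes matched against st[0] in complete() above:
    # 'n' is normal (clean), 'm' is merged, 'a' is added and 'r' is removed;
    # --normal therefore matches both 'n' and 'm' entries.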
    acceptable = ''
    if opts[r'normal']:
        acceptable += 'nm'
    if opts[r'added']:
        acceptable += 'a'
    if opts[r'removed']:
        acceptable += 'r'
    cwd = repo.getcwd()
    if not specs:
        specs = ['.']

    files, dirs = set(), set()
    for spec in specs:
        f, d = complete(spec, acceptable or 'nmar')
        files.update(f)
        dirs.update(d)
    files.update(dirs)
    ui.write('\n'.join(repo.pathto(p, cwd) for p in sorted(files)))
    ui.write('\n')

@command('debugpeer', [], _('PATH'), norepo=True)
def debugpeer(ui, path):
    """establish a connection to a peer repository"""
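    # Illustrative session (hypothetical path; 'local' and 'pushable' simply
    # reflect what peer.local() and peer.canpush() report for the real peer):
    #   $ hg debugpeer ssh://user@example.com/repo
    #   url: ssh://user@example.com/repo
    #   local: no
    #   pushable: yes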
    # Always enable peer request logging; --debug is still required for the
    # log to be displayed.
    overrides = {
        ('devel', 'debug.peer-request'): True,
    }

    with ui.configoverride(overrides):
        peer = hg.peer(ui, {}, path)

        local = peer.local() is not None
        canpush = peer.canpush()

        ui.write(_('url: %s\n') % peer.url())
        ui.write(_('local: %s\n') % (_('yes') if local else _('no')))
        ui.write(_('pushable: %s\n') % (_('yes') if canpush else _('no')))

@command('debugpickmergetool',
         [('r', 'rev', '', _('check for files in this revision'), _('REV')),
          ('', 'changedelete', None, _('emulate merging change and delete')),
         ] + cmdutil.walkopts + cmdutil.mergetoolopts,
         _('[PATTERN]...'),
         inferrepo=True)
def debugpickmergetool(ui, repo, *pats, **opts):
    """examine which merge tool is chosen for the specified file

    As described in :hg:`help merge-tools`, Mercurial examines the
    configurations below, in this order, to decide which merge tool is
    chosen for the specified file.

    1. ``--tool`` option
    2. ``HGMERGE`` environment variable
    3. configurations in ``merge-patterns`` section
    4. configuration of ``ui.merge``
    5. configurations in ``merge-tools`` section
    6. ``hgmerge`` tool (for historical reasons only)
    7. default tool for fallback (``:merge`` or ``:prompt``)

    This command writes out the examination result in the style below::

        FILE = MERGETOOL

    By default, all files known in the first parent context of the
    working directory are examined. Use file patterns and/or -I/-X
    options to limit target files. -r/--rev is also useful to examine
    files in another context without actually updating to it.

    With --debug, this command also shows warning messages while matching
    against ``merge-patterns`` and so on. It is recommended to use this
    option with explicit file patterns and/or -I/-X options, because it
    increases the amount of output per file according to the configurations
    in hgrc.

    With -v/--verbose, this command shows the configurations below first
    (only if specified).

    - ``--tool`` option
    - ``HGMERGE`` environment variable
    - configuration of ``ui.merge``

    If the merge tool is chosen before matching against
    ``merge-patterns``, this command can't show any helpful
    information, even with --debug. In such a case, the information above
    is useful for knowing why a merge tool is chosen.
    """
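    # Illustrative run (hypothetical file; the reported tool depends entirely
    # on local configuration, ``:merge`` being one of the built-in tools):
    #   $ hg debugpickmergetool --rev . foo.txt
    #   foo.txt = :merge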
    opts = pycompat.byteskwargs(opts)
    overrides = {}
    if opts['tool']:
        overrides[('ui', 'forcemerge')] = opts['tool']
        ui.note(('with --tool %r\n') % (pycompat.bytestr(opts['tool'])))

    with ui.configoverride(overrides, 'debugmergepatterns'):
        hgmerge = encoding.environ.get("HGMERGE")
        if hgmerge is not None:
            ui.note(('with HGMERGE=%r\n') % (pycompat.bytestr(hgmerge)))
        uimerge = ui.config("ui", "merge")
        if uimerge:
            ui.note(('with ui.merge=%r\n') % (pycompat.bytestr(uimerge)))

        ctx = scmutil.revsingle(repo, opts.get('rev'))
        m = scmutil.match(ctx, pats, opts)
        changedelete = opts['changedelete']
        for path in ctx.walk(m):
            fctx = ctx[path]
            try:
                if not ui.debugflag:
                    ui.pushbuffer(error=True)
                tool, toolpath = filemerge._picktool(repo, ui, path,
                                                     fctx.isbinary(),
                                                     'l' in fctx.flags(),
                                                     changedelete)
            finally:
                if not ui.debugflag:
                    ui.popbuffer()
            ui.write(('%s = %s\n') % (path, tool))

@command('debugpushkey', [], _('REPO NAMESPACE [KEY OLD NEW]'), norepo=True)
def debugpushkey(ui, repopath, namespace, *keyinfo, **opts):
    '''access the pushkey key/value protocol

    With two args, list the keys in the given namespace.

    With five args, set a key to new if it currently is set to old.
    Reports success or failure.
    '''
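    # Illustrative two-arg form (hypothetical repository path; the values
    # printed depend on the peer). Each key/value pair is written
    # tab-separated, one per line:
    #   $ hg debugpushkey /path/to/repo bookmarks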

    target = hg.peer(ui, {}, repopath)
    if keyinfo:
        key, old, new = keyinfo
        with target.commandexecutor() as e:
            r = e.callcommand('pushkey', {
                'namespace': namespace,
                'key': key,
                'old': old,
                'new': new,
            }).result()

        ui.status(pycompat.bytestr(r) + '\n')
        return not r
    else:
        for k, v in sorted(target.listkeys(namespace).iteritems()):
            ui.write("%s\t%s\n" % (stringutil.escapestr(k),
                                   stringutil.escapestr(v)))

@command('debugpvec', [], _('A B'))
def debugpvec(ui, repo, a, b=None):
    ca = scmutil.revsingle(repo, a)
    cb = scmutil.revsingle(repo, b)
    pa = pvec.ctxpvec(ca)
    pb = pvec.ctxpvec(cb)
    if pa == pb:
        rel = "="
    elif pa > pb:
        rel = ">"
    elif pa < pb:
        rel = "<"
    elif pa | pb:
        rel = "|"
    ui.write(_("a: %s\n") % pa)
    ui.write(_("b: %s\n") % pb)
    ui.write(_("depth(a): %d depth(b): %d\n") % (pa._depth, pb._depth))
    ui.write(_("delta: %d hdist: %d distance: %d relation: %s\n") %
             (abs(pa._depth - pb._depth), pvec._hamming(pa._vec, pb._vec),
              pa.distance(pb), rel))

@command('debugrebuilddirstate|debugrebuildstate',
         [('r', 'rev', '', _('revision to rebuild to'), _('REV')),
          ('', 'minimal', None, _('only rebuild files that are inconsistent '
                                  'with the working copy parent')),
         ],
         _('[-r REV]'))
def debugrebuilddirstate(ui, repo, rev, **opts):
    """rebuild the dirstate as it would look for the given revision

    If no revision is specified, the first parent of the working copy is used.

    The dirstate will be set to the files of the given revision.
    The actual working directory content or existing dirstate
    information such as adds or removes is not considered.

    ``minimal`` will only rebuild the dirstate status for files that claim to
    be tracked but are not in the parent manifest, or that exist in the parent
    manifest but are not in the dirstate. It will not change adds, removes, or
    modified files that are in the working copy parent.

    One use of this command is to make the next :hg:`status` invocation
    check the actual file content.
    """
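    # Illustrative use: with no revision, rebuild against the working copy
    # parent so the next :hg:`status` re-checks actual file content:
    #   $ hg debugrebuilddirstate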
    ctx = scmutil.revsingle(repo, rev)
    with repo.wlock():
        dirstate = repo.dirstate
        changedfiles = None
        # See command doc for what minimal does.
        if opts.get(r'minimal'):
            manifestfiles = set(ctx.manifest().keys())
            dirstatefiles = set(dirstate)
            manifestonly = manifestfiles - dirstatefiles
            dsonly = dirstatefiles - manifestfiles
            dsnotadded = set(f for f in dsonly if dirstate[f] != 'a')
            changedfiles = manifestonly | dsnotadded

        dirstate.rebuild(ctx.node(), ctx.manifest(), changedfiles)

@command('debugrebuildfncache', [], '')
def debugrebuildfncache(ui, repo):
    """rebuild the fncache file"""
    repair.rebuildfncache(ui, repo)

@command('debugrename',
         [('r', 'rev', '', _('revision to debug'), _('REV'))],
         _('[-r REV] FILE'))
def debugrename(ui, repo, file1, *pats, **opts):
    """dump rename information"""

    opts = pycompat.byteskwargs(opts)
    ctx = scmutil.revsingle(repo, opts.get('rev'))
    m = scmutil.match(ctx, (file1,) + pats, opts)
    for abs in ctx.walk(m):
        fctx = ctx[abs]
        o = fctx.filelog().renamed(fctx.filenode())
        rel = m.rel(abs)
        if o:
            ui.write(_("%s renamed from %s:%s\n") % (rel, o[0], hex(o[1])))
        else:
            ui.write(_("%s not renamed\n") % rel)

@command('debugrevlog', cmdutil.debugrevlogopts +
         [('d', 'dump', False, _('dump index data'))],
         _('-c|-m|FILE'),
         optionalrepo=True)
def debugrevlog(ui, repo, file_=None, **opts):
    """show data and statistics about a revlog"""
    opts = pycompat.byteskwargs(opts)
    r = cmdutil.openrevlog(repo, 'debugrevlog', file_, opts)

    if opts.get("dump"):
        numrevs = len(r)
        ui.write(("# rev p1rev p2rev start end deltastart base p1 p2"
                  " rawsize totalsize compression heads chainlen\n"))
        ts = 0
        heads = set()

        for rev in pycompat.xrange(numrevs):
            dbase = r.deltaparent(rev)
            if dbase == -1:
                dbase = rev
            cbase = r.chainbase(rev)
            clen = r.chainlen(rev)
            p1, p2 = r.parentrevs(rev)
            rs = r.rawsize(rev)
            ts = ts + rs
            heads -= set(r.parentrevs(rev))
            heads.add(rev)
            try:
                compression = ts / r.end(rev)
            except ZeroDivisionError:
                compression = 0
            ui.write("%5d %5d %5d %5d %5d %10d %4d %4d %4d %7d %9d "
                     "%11d %5d %8d\n" %
                     (rev, p1, p2, r.start(rev), r.end(rev),
                      r.start(dbase), r.start(cbase),
                      r.start(p1), r.start(p2),
                      rs, ts, compression, len(heads), clen))
        return 0

    v = r.version
    format = v & 0xFFFF
    flags = []
    gdelta = False
    if v & revlog.FLAG_INLINE_DATA:
        flags.append('inline')
    if v & revlog.FLAG_GENERALDELTA:
        gdelta = True
        flags.append('generaldelta')
    if not flags:
        flags = ['(none)']

    ### tracks merge vs single parent
    nummerges = 0

    ### tracks the ways a "delta" is built
    # nodelta
    numempty = 0
    numemptytext = 0
    numemptydelta = 0
    # full file content
    numfull = 0
    # intermediate snapshot against a prior snapshot
    numsemi = 0
    # snapshot count per depth
    numsnapdepth = collections.defaultdict(lambda: 0)
    # delta against previous revision
    numprev = 0
    # delta against first or second parent (not prev)
    nump1 = 0
    nump2 = 0
    # delta against neither prev nor parents
    numother = 0
    # delta against prev that is also the first or second parent
    # (details of `numprev`)
    nump1prev = 0
    nump2prev = 0

    # data about the delta chain of each rev
    chainlengths = []
    chainbases = []
    chainspans = []

    # data about each revision
    datasize = [None, 0, 0]
    fullsize = [None, 0, 0]
    semisize = [None, 0, 0]
    # snapshot count per depth
    snapsizedepth = collections.defaultdict(lambda: [None, 0, 0])
    deltasize = [None, 0, 0]
    chunktypecounts = {}
    chunktypesizes = {}

    def addsize(size, l):
        if l[0] is None or size < l[0]:
            l[0] = size
        if size > l[1]:
            l[1] = size
        l[2] += size
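    # Each of the size lists above is a [min, max, total] accumulator
    # maintained by addsize(); the totals are converted to averages further
    # down once the per-category revision counts are known.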

    numrevs = len(r)
    for rev in pycompat.xrange(numrevs):
        p1, p2 = r.parentrevs(rev)
        delta = r.deltaparent(rev)
        if format > 0:
            addsize(r.rawsize(rev), datasize)
        if p2 != nullrev:
            nummerges += 1
        size = r.length(rev)
        if delta == nullrev:
            chainlengths.append(0)
            chainbases.append(r.start(rev))
            chainspans.append(size)
            if size == 0:
                numempty += 1
                numemptytext += 1
            else:
                numfull += 1
                numsnapdepth[0] += 1
                addsize(size, fullsize)
                addsize(size, snapsizedepth[0])
        else:
            chainlengths.append(chainlengths[delta] + 1)
            baseaddr = chainbases[delta]
            revaddr = r.start(rev)
            chainbases.append(baseaddr)
            chainspans.append((revaddr - baseaddr) + size)
            if size == 0:
                numempty += 1
                numemptydelta += 1
            elif r.issnapshot(rev):
                addsize(size, semisize)
                numsemi += 1
                depth = r.snapshotdepth(rev)
                numsnapdepth[depth] += 1
                addsize(size, snapsizedepth[depth])
            else:
                addsize(size, deltasize)
                if delta == rev - 1:
                    numprev += 1
                    if delta == p1:
                        nump1prev += 1
                    elif delta == p2:
                        nump2prev += 1
                elif delta == p1:
                    nump1 += 1
                elif delta == p2:
                    nump2 += 1
                elif delta != nullrev:
                    numother += 1

        # Obtain data on the raw chunks in the revlog.
        if util.safehasattr(r, '_getsegmentforrevs'):
            segment = r._getsegmentforrevs(rev, rev)[1]
        else:
            segment = r._revlog._getsegmentforrevs(rev, rev)[1]
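        # The first byte of a revlog chunk identifies its on-disk encoding:
        # 'u' marks data stored uncompressed and 'x' is the zlib header byte;
        # other compression engines use their own marker bytes.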
        if segment:
            chunktype = bytes(segment[0:1])
        else:
            chunktype = 'empty'

        if chunktype not in chunktypecounts:
            chunktypecounts[chunktype] = 0
            chunktypesizes[chunktype] = 0

        chunktypecounts[chunktype] += 1
        chunktypesizes[chunktype] += size

    # Adjust size min value for empty cases
    for size in (datasize, fullsize, semisize, deltasize):
        if size[0] is None:
            size[0] = 0

    numdeltas = numrevs - numfull - numempty - numsemi
    numoprev = numprev - nump1prev - nump2prev
    totalrawsize = datasize[2]
    datasize[2] /= numrevs
    fulltotal = fullsize[2]
    fullsize[2] /= numfull
    semitotal = semisize[2]
    snaptotal = {}
    if 0 < numsemi:
        semisize[2] /= numsemi
    for depth in snapsizedepth:
        snaptotal[depth] = snapsizedepth[depth][2]
        snapsizedepth[depth][2] /= numsnapdepth[depth]

    deltatotal = deltasize[2]
    if numdeltas > 0:
        deltasize[2] /= numdeltas
    totalsize = fulltotal + semitotal + deltatotal
    avgchainlen = sum(chainlengths) / numrevs
    maxchainlen = max(chainlengths)
    maxchainspan = max(chainspans)
    compratio = 1
    if totalsize:
        compratio = totalrawsize / totalsize

    basedfmtstr = '%%%dd\n'
    basepcfmtstr = '%%%dd %s(%%5.2f%%%%)\n'

    def dfmtstr(max):
        return basedfmtstr % len(str(max))
    def pcfmtstr(max, padding=0):
        return basepcfmtstr % (len(str(max)), ' ' * padding)

    def pcfmt(value, total):
        if total:
            return (value, 100 * float(value) / total)
        else:
            return value, 100.0

    ui.write(('format : %d\n') % format)
    ui.write(('flags : %s\n') % ', '.join(flags))

    ui.write('\n')
    fmt = pcfmtstr(totalsize)
    fmt2 = dfmtstr(totalsize)
    ui.write(('revisions : ') + fmt2 % numrevs)
    ui.write((' merges : ') + fmt % pcfmt(nummerges, numrevs))
    ui.write((' normal : ') + fmt % pcfmt(numrevs - nummerges, numrevs))
    ui.write(('revisions : ') + fmt2 % numrevs)
    ui.write((' empty : ') + fmt % pcfmt(numempty, numrevs))
    ui.write((' text : ')
             + fmt % pcfmt(numemptytext, numemptytext + numemptydelta))
    ui.write((' delta : ')
             + fmt % pcfmt(numemptydelta, numemptytext + numemptydelta))
    ui.write((' snapshot : ') + fmt % pcfmt(numfull + numsemi, numrevs))
    for depth in sorted(numsnapdepth):
        ui.write((' lvl-%-3d : ' % depth)
                 + fmt % pcfmt(numsnapdepth[depth], numrevs))
    ui.write((' deltas : ') + fmt % pcfmt(numdeltas, numrevs))
    ui.write(('revision size : ') + fmt2 % totalsize)
    ui.write((' snapshot : ')
             + fmt % pcfmt(fulltotal + semitotal, totalsize))
    for depth in sorted(numsnapdepth):
        ui.write((' lvl-%-3d : ' % depth)
                 + fmt % pcfmt(snaptotal[depth], totalsize))
    ui.write((' deltas : ') + fmt % pcfmt(deltatotal, totalsize))

    def fmtchunktype(chunktype):
        if chunktype == 'empty':
            return ' %s : ' % chunktype
        elif chunktype in pycompat.bytestr(string.ascii_letters):
            return ' 0x%s (%s) : ' % (hex(chunktype), chunktype)
        else:
            return ' 0x%s : ' % hex(chunktype)

    ui.write('\n')
    ui.write(('chunks : ') + fmt2 % numrevs)
    for chunktype in sorted(chunktypecounts):
        ui.write(fmtchunktype(chunktype))
        ui.write(fmt % pcfmt(chunktypecounts[chunktype], numrevs))
    ui.write(('chunks size : ') + fmt2 % totalsize)
    for chunktype in sorted(chunktypecounts):
        ui.write(fmtchunktype(chunktype))
        ui.write(fmt % pcfmt(chunktypesizes[chunktype], totalsize))

    ui.write('\n')
    fmt = dfmtstr(max(avgchainlen, maxchainlen, maxchainspan, compratio))
    ui.write(('avg chain length : ') + fmt % avgchainlen)
    ui.write(('max chain length : ') + fmt % maxchainlen)
    ui.write(('max chain reach : ') + fmt % maxchainspan)
    ui.write(('compression ratio : ') + fmt % compratio)

    if format > 0:
        ui.write('\n')
        ui.write(('uncompressed data size (min/max/avg) : %d / %d / %d\n')
                 % tuple(datasize))
        ui.write(('full revision size (min/max/avg) : %d / %d / %d\n')
                 % tuple(fullsize))
        ui.write(('inter-snapshot size (min/max/avg) : %d / %d / %d\n')
                 % tuple(semisize))
        for depth in sorted(snapsizedepth):
            if depth == 0:
                continue
            ui.write((' level-%-3d (min/max/avg) : %d / %d / %d\n')
                     % ((depth,) + tuple(snapsizedepth[depth])))
        ui.write(('delta size (min/max/avg) : %d / %d / %d\n')
                 % tuple(deltasize))

    if numdeltas > 0:
        ui.write('\n')
        fmt = pcfmtstr(numdeltas)
        fmt2 = pcfmtstr(numdeltas, 4)
        ui.write(('deltas against prev : ') + fmt % pcfmt(numprev, numdeltas))
        if numprev > 0:
            ui.write((' where prev = p1 : ') + fmt2 % pcfmt(nump1prev,
                                                            numprev))
            ui.write((' where prev = p2 : ') + fmt2 % pcfmt(nump2prev,
                                                            numprev))
            ui.write((' other : ') + fmt2 % pcfmt(numoprev,
                                                  numprev))
        if gdelta:
            ui.write(('deltas against p1 : ')
                     + fmt % pcfmt(nump1, numdeltas))
            ui.write(('deltas against p2 : ')
                     + fmt % pcfmt(nump2, numdeltas))
        ui.write(('deltas against other : ') + fmt % pcfmt(numother,
                                                           numdeltas))

@command('debugrevlogindex', cmdutil.debugrevlogopts +
         [('f', 'format', 0, _('revlog format'), _('FORMAT'))],
         _('[-f FORMAT] -c|-m|FILE'),
         optionalrepo=True)
def debugrevlogindex(ui, repo, file_=None, **opts):
    """dump the contents of a revlog index"""
    opts = pycompat.byteskwargs(opts)
    r = cmdutil.openrevlog(repo, 'debugrevlogindex', file_, opts)
    format = opts.get('format', 0)
    if format not in (0, 1):
        raise error.Abort(_("unknown format %d") % format)

    if ui.debugflag:
        shortfn = hex
    else:
        shortfn = short

    # There might not be anything in r, so have a sane default
    idlen = 12
    for i in r:
        idlen = len(shortfn(r.node(i)))
        break

    if format == 0:
        if ui.verbose:
            ui.write((" rev offset length linkrev"
                      " %s %s p2\n") % ("nodeid".ljust(idlen),
                                        "p1".ljust(idlen)))
        else:
            ui.write((" rev linkrev %s %s p2\n") % (
                "nodeid".ljust(idlen), "p1".ljust(idlen)))
    elif format == 1:
        if ui.verbose:
            ui.write((" rev flag offset length size link p1"
                      " p2 %s\n") % "nodeid".rjust(idlen))
        else:
            ui.write((" rev flag size link p1 p2 %s\n") %
                     "nodeid".rjust(idlen))

    for i in r:
        node = r.node(i)
        if format == 0:
            try:
                pp = r.parents(node)
            except Exception:
                pp = [nullid, nullid]
            if ui.verbose:
                ui.write("% 6d % 9d % 7d % 7d %s %s %s\n" % (
                    i, r.start(i), r.length(i), r.linkrev(i),
                    shortfn(node), shortfn(pp[0]), shortfn(pp[1])))
            else:
                ui.write("% 6d % 7d %s %s %s\n" % (
                    i, r.linkrev(i), shortfn(node), shortfn(pp[0]),
                    shortfn(pp[1])))
        elif format == 1:
            pr = r.parentrevs(i)
            if ui.verbose:
                ui.write("% 6d %04x % 8d % 8d % 8d % 6d % 6d % 6d %s\n" % (
                    i, r.flags(i), r.start(i), r.length(i), r.rawsize(i),
                    r.linkrev(i), pr[0], pr[1], shortfn(node)))
            else:
                ui.write("% 6d %04x % 8d % 6d % 6d % 6d %s\n" % (
                    i, r.flags(i), r.rawsize(i), r.linkrev(i), pr[0], pr[1],
                    shortfn(node)))

@command('debugrevspec',
         [('', 'optimize', None,
           _('print parsed tree after optimizing (DEPRECATED)')),
          ('', 'show-revs', True, _('print list of result revisions (default)')),
          ('s', 'show-set', None, _('print internal representation of result set')),
          ('p', 'show-stage', [],
           _('print parsed tree at the given stage'), _('NAME')),
          ('', 'no-optimized', False, _('evaluate tree without optimization')),
          ('', 'verify-optimized', False, _('verify optimized result')),
         ],
         ('REVSPEC'))
def debugrevspec(ui, repo, expr, **opts):
    """parse and apply a revision specification

    Use the -p/--show-stage option to print the parsed tree at the given
    stages. Use -p all to print the tree at every stage.

    Use --no-show-revs with -s or -p to print only the set representation
    or the parsed tree, respectively.

    Use --verify-optimized to compare the optimized result with the
    unoptimized one. Returns 1 if the optimized result differs.
    """
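    # Illustrative run (the stage names come from the `stages` table below):
    #   $ hg debugrevspec -p analyzed -p optimized 'draft() and head()'
    # prints the tree after the 'analyzed' and 'optimized' stages, then the
    # matching revision numbers, one per line.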
    opts = pycompat.byteskwargs(opts)
    aliases = ui.configitems('revsetalias')
    stages = [
        ('parsed', lambda tree: tree),
        ('expanded', lambda tree: revsetlang.expandaliases(tree, aliases,
                                                           ui.warn)),
        ('concatenated', revsetlang.foldconcat),
        ('analyzed', revsetlang.analyze),
        ('optimized', revsetlang.optimize),
    ]
    if opts['no_optimized']:
        stages = stages[:-1]
    if opts['verify_optimized'] and opts['no_optimized']:
        raise error.Abort(_('cannot use --verify-optimized with '
                            '--no-optimized'))
    stagenames = set(n for n, f in stages)

    showalways = set()
    showchanged = set()
    if ui.verbose and not opts['show_stage']:
        # show parsed tree by --verbose (deprecated)
        showalways.add('parsed')
        showchanged.update(['expanded', 'concatenated'])
    if opts['optimize']:
        showalways.add('optimized')
    if opts['show_stage'] and opts['optimize']:
        raise error.Abort(_('cannot use --optimize with --show-stage'))
    if opts['show_stage'] == ['all']:
        showalways.update(stagenames)
    else:
        for n in opts['show_stage']:
            if n not in stagenames:
                raise error.Abort(_('invalid stage name: %s') % n)
        showalways.update(opts['show_stage'])

    treebystage = {}
    printedtree = None
    tree = revsetlang.parse(expr, lookup=revset.lookupfn(repo))
    for n, f in stages:
        treebystage[n] = tree = f(tree)
        if n in showalways or (n in showchanged and tree != printedtree):
            if opts['show_stage'] or n != 'parsed':
                ui.write(("* %s:\n") % n)
            ui.write(revsetlang.prettyformat(tree), "\n")
            printedtree = tree

    if opts['verify_optimized']:
        arevs = revset.makematcher(treebystage['analyzed'])(repo)
        brevs = revset.makematcher(treebystage['optimized'])(repo)
        if opts['show_set'] or (opts['show_set'] is None and ui.verbose):
            ui.write(("* analyzed set:\n"), stringutil.prettyrepr(arevs), "\n")
            ui.write(("* optimized set:\n"), stringutil.prettyrepr(brevs), "\n")
        arevs = list(arevs)
        brevs = list(brevs)
        if arevs == brevs:
            return 0
        ui.write(('--- analyzed\n'), label='diff.file_a')
        ui.write(('+++ optimized\n'), label='diff.file_b')
        sm = difflib.SequenceMatcher(None, arevs, brevs)
        for tag, alo, ahi, blo, bhi in sm.get_opcodes():
            if tag in ('delete', 'replace'):
                for c in arevs[alo:ahi]:
                    ui.write('-%s\n' % c, label='diff.deleted')
            if tag in ('insert', 'replace'):
                for c in brevs[blo:bhi]:
                    ui.write('+%s\n' % c, label='diff.inserted')
            if tag == 'equal':
                for c in arevs[alo:ahi]:
                    ui.write(' %s\n' % c)
        return 1

    func = revset.makematcher(tree)
    revs = func(repo)
    if opts['show_set'] or (opts['show_set'] is None and ui.verbose):
        ui.write(("* set:\n"), stringutil.prettyrepr(revs), "\n")
    if not opts['show_revs']:
        return
    for c in revs:
        ui.write("%d\n" % c)

@command('debugserve', [
    ('', 'sshstdio', False, _('run an SSH server bound to process handles')),
    ('', 'logiofd', '', _('file descriptor to log server I/O to')),
    ('', 'logiofile', '', _('file to log server I/O to')),
], '')
def debugserve(ui, repo, **opts):
    """run a server with advanced settings

    This command is similar to :hg:`serve`. It exists partially as a
    workaround for the fact that ``hg serve --stdio`` must have specific
    arguments for security reasons.
    """
    opts = pycompat.byteskwargs(opts)

    if not opts['sshstdio']:
        raise error.Abort(_('only --sshstdio is currently supported'))

    logfh = None

    if opts['logiofd'] and opts['logiofile']:
        raise error.Abort(_('cannot use both --logiofd and --logiofile'))

    if opts['logiofd']:
        # Line buffered because output is line based.
        try:
            logfh = os.fdopen(int(opts['logiofd']), r'ab', 1)
        except OSError as e:
            if e.errno != errno.ESPIPE:
                raise
            # can't seek a pipe, so `ab` mode fails on py3
            logfh = os.fdopen(int(opts['logiofd']), r'wb', 1)
    elif opts['logiofile']:
        logfh = open(opts['logiofile'], 'ab', 1)

    s = wireprotoserver.sshserver(ui, repo, logfh=logfh)
    s.serve_forever()

@command('debugsetparents', [], _('REV1 [REV2]'))
def debugsetparents(ui, repo, rev1, rev2=None):
    """manually set the parents of the current working directory

    This is useful for writing repository conversion tools, but should
    be used with care. For example, neither the working directory nor the
    dirstate is updated, so file status may be incorrect after running this
    command.

    Returns 0 on success.
    """
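    # Illustrative use (hypothetical revisions): pretend the working
    # directory is a merge of revisions 3 and 7 without touching any files:
    #   $ hg debugsetparents 3 7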

    node1 = scmutil.revsingle(repo, rev1).node()
    node2 = scmutil.revsingle(repo, rev2, 'null').node()

    with repo.wlock():
        repo.setparents(node1, node2)

@command('debugssl', [], '[SOURCE]', optionalrepo=True)
def debugssl(ui, repo, source=None, **opts):
    '''test a secure connection to a server

    This builds the certificate chain for the server on Windows, installing
    the missing intermediates and trusted root via Windows Update if
    necessary. It does nothing on other platforms.

    If SOURCE is omitted, the 'default' path will be used. If a URL is given,
    that server is used. See :hg:`help urls` for more information.

    If the update succeeds, retry the original operation. Otherwise, the cause
    of the SSL error is likely another issue.
    '''
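    # Illustrative run on Windows (hypothetical host); the status lines are
    # the ones emitted below:
    #   $ hg debugssl https://example.com/
    #   checking the certificate chain for example.com
    #   full certificate chain is available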
2545 if not pycompat.iswindows:
2549 if not pycompat.iswindows:
2546 raise error.Abort(_('certificate chain building is only possible on '
2550 raise error.Abort(_('certificate chain building is only possible on '
2547 'Windows'))
2551 'Windows'))
2548
2552
2549 if not source:
2553 if not source:
2550 if not repo:
2554 if not repo:
2551 raise error.Abort(_("there is no Mercurial repository here, and no "
2555 raise error.Abort(_("there is no Mercurial repository here, and no "
2552 "server specified"))
2556 "server specified"))
2553 source = "default"
2557 source = "default"
2554
2558
2555 source, branches = hg.parseurl(ui.expandpath(source))
2559 source, branches = hg.parseurl(ui.expandpath(source))
2556 url = util.url(source)
2560 url = util.url(source)
2557 addr = None
2561 addr = None
2558
2562
2559 defaultport = {'https': 443, 'ssh': 22}
2563 defaultport = {'https': 443, 'ssh': 22}
2560 if url.scheme in defaultport:
2564 if url.scheme in defaultport:
2561 try:
2565 try:
2562 addr = (url.host, int(url.port or defaultport[url.scheme]))
2566 addr = (url.host, int(url.port or defaultport[url.scheme]))
2563 except ValueError:
2567 except ValueError:
2564 raise error.Abort(_("malformed port number in URL"))
2568 raise error.Abort(_("malformed port number in URL"))
2565 else:
2569 else:
2566 raise error.Abort(_("only https and ssh connections are supported"))
2570 raise error.Abort(_("only https and ssh connections are supported"))
2567
2571
2568 from . import win32
2572 from . import win32
2569
2573
2570 s = ssl.wrap_socket(socket.socket(), ssl_version=ssl.PROTOCOL_TLS,
2574 s = ssl.wrap_socket(socket.socket(), ssl_version=ssl.PROTOCOL_TLS,
2571 cert_reqs=ssl.CERT_NONE, ca_certs=None)
2575 cert_reqs=ssl.CERT_NONE, ca_certs=None)
2572
2576
2573 try:
2577 try:
2574 s.connect(addr)
2578 s.connect(addr)
2575 cert = s.getpeercert(True)
2579 cert = s.getpeercert(True)
2576
2580
2577 ui.status(_('checking the certificate chain for %s\n') % url.host)
2581 ui.status(_('checking the certificate chain for %s\n') % url.host)
2578
2582
2579 complete = win32.checkcertificatechain(cert, build=False)
2583 complete = win32.checkcertificatechain(cert, build=False)
2580
2584
2581 if not complete:
2585 if not complete:
2582 ui.status(_('certificate chain is incomplete, updating... '))
2586 ui.status(_('certificate chain is incomplete, updating... '))
2583
2587
2584 if not win32.checkcertificatechain(cert):
2588 if not win32.checkcertificatechain(cert):
2585 ui.status(_('failed.\n'))
2589 ui.status(_('failed.\n'))
2586 else:
2590 else:
2587 ui.status(_('done.\n'))
2591 ui.status(_('done.\n'))
2588 else:
2592 else:
2589 ui.status(_('full certificate chain is available\n'))
2593 ui.status(_('full certificate chain is available\n'))
2590 finally:
2594 finally:
2591 s.close()
2595 s.close()
2592
2596
2593 @command('debugsub',
2597 @command('debugsub',
2594 [('r', 'rev', '',
2598 [('r', 'rev', '',
2595 _('revision to check'), _('REV'))],
2599 _('revision to check'), _('REV'))],
2596 _('[-r REV] [REV]'))
2600 _('[-r REV] [REV]'))
2597 def debugsub(ui, repo, rev=None):
2601 def debugsub(ui, repo, rev=None):
2598 ctx = scmutil.revsingle(repo, rev, None)
2602 ctx = scmutil.revsingle(repo, rev, None)
2599 for k, v in sorted(ctx.substate.items()):
2603 for k, v in sorted(ctx.substate.items()):
2600 ui.write(('path %s\n') % k)
2604 ui.write(('path %s\n') % k)
2601 ui.write((' source %s\n') % v[0])
2605 ui.write((' source %s\n') % v[0])
2602 ui.write((' revision %s\n') % v[1])
2606 ui.write((' revision %s\n') % v[1])
2603
2607
2604 @command('debugsuccessorssets',
2608 @command('debugsuccessorssets',
2605 [('', 'closest', False, _('return closest successors sets only'))],
2609 [('', 'closest', False, _('return closest successors sets only'))],
2606 _('[REV]'))
2610 _('[REV]'))
2607 def debugsuccessorssets(ui, repo, *revs, **opts):
2611 def debugsuccessorssets(ui, repo, *revs, **opts):
2608 """show set of successors for revision
2612 """show set of successors for revision
2609
2613
2610 A successors set of changeset A is a consistent group of revisions that
2614 A successors set of changeset A is a consistent group of revisions that
2615 succeed A. It contains non-obsolete changesets only, unless the closest
2616 successors sets are requested (--closest).
2617
2618 In most cases a changeset A has a single successors set containing a single
2619 successor (changeset A replaced by A').
2620
2621 A changeset that is made obsolete with no successors is called "pruned".
2622 Such changesets have no successors sets at all.
2623
2624 A changeset that has been "split" will have a successors set containing
2625 more than one successor.
2626
2627 A changeset that has been rewritten in multiple different ways is called
2628 "divergent". Such changesets have multiple successor sets (each of which
2629 may also be split, i.e. have multiple successors).
2630
2631 Results are displayed as follows::
2632
2633 <rev1>
2634 <successors-1A>
2635 <rev2>
2636 <successors-2A>
2637 <successors-2B1> <successors-2B2> <successors-2B3>
2638
2639 Here rev2 has two possible (i.e. divergent) successors sets. The first
2640 holds one element, whereas the second holds three (i.e. the changeset has
2641 been split).
2642 """
2643 # passed to successorssets caching computation from one call to another
2644 cache = {}
2645 ctx2str = bytes
2646 node2str = short
2647 for rev in scmutil.revrange(repo, revs):
2648 ctx = repo[rev]
2649 ui.write('%s\n'% ctx2str(ctx))
2650 for succsset in obsutil.successorssets(repo, ctx.node(),
2651 closest=opts[r'closest'],
2652 cache=cache):
2653 if succsset:
2654 ui.write(' ')
2655 ui.write(node2str(succsset[0]))
2656 for node in succsset[1:]:
2657 ui.write(' ')
2658 ui.write(node2str(node))
2659 ui.write('\n')
2660
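For illustration, a minimal sketch of consuming the ``obsutil.successorssets`` API used above (``repo`` is assumed to be an open local repository; ``obsutil`` and ``short`` are imports this file already has)::

    cache = {}  # reused across calls, as in debugsuccessorssets above
    ctx = repo['.']  # assumption: 'repo' is an open local repository
    for succsset in obsutil.successorssets(repo, ctx.node(), cache=cache):
        # an empty successors set means the changeset was pruned
        print(' '.join(short(node) for node in succsset))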
2661 @command('debugtemplate',
2662 [('r', 'rev', [], _('apply template on changesets'), _('REV')),
2663 ('D', 'define', [], _('define template keyword'), _('KEY=VALUE'))],
2664 _('[-r REV]... [-D KEY=VALUE]... TEMPLATE'),
2665 optionalrepo=True)
2666 def debugtemplate(ui, repo, tmpl, **opts):
2667 """parse and apply a template
2668
2669 If -r/--rev is given, the template is processed as a log template and
2670 applied to the given changesets. Otherwise, it is processed as a generic
2671 template.
2672
2673 Use --verbose to print the parsed tree.
2674 """
2675 revs = None
2676 if opts[r'rev']:
2677 if repo is None:
2678 raise error.RepoError(_('there is no Mercurial repository here '
2679 '(.hg not found)'))
2680 revs = scmutil.revrange(repo, opts[r'rev'])
2681
2682 props = {}
2683 for d in opts[r'define']:
2684 try:
2685 k, v = (e.strip() for e in d.split('=', 1))
2686 if not k or k == 'ui':
2687 raise ValueError
2688 props[k] = v
2689 except ValueError:
2690 raise error.Abort(_('malformed keyword definition: %s') % d)
2691
2692 if ui.verbose:
2693 aliases = ui.configitems('templatealias')
2694 tree = templater.parse(tmpl)
2695 ui.note(templater.prettyformat(tree), '\n')
2696 newtree = templater.expandaliases(tree, aliases)
2697 if newtree != tree:
2698 ui.note(("* expanded:\n"), templater.prettyformat(newtree), '\n')
2699
2700 if revs is None:
2701 tres = formatter.templateresources(ui, repo)
2702 t = formatter.maketemplater(ui, tmpl, resources=tres)
2703 if ui.verbose:
2704 kwds, funcs = t.symbolsuseddefault()
2705 ui.write(("* keywords: %s\n") % ', '.join(sorted(kwds)))
2706 ui.write(("* functions: %s\n") % ', '.join(sorted(funcs)))
2707 ui.write(t.renderdefault(props))
2708 else:
2709 displayer = logcmdutil.maketemplater(ui, repo, tmpl)
2710 if ui.verbose:
2711 kwds, funcs = displayer.t.symbolsuseddefault()
2712 ui.write(("* keywords: %s\n") % ', '.join(sorted(kwds)))
2713 ui.write(("* functions: %s\n") % ', '.join(sorted(funcs)))
2714 for r in revs:
2715 displayer.show(repo[r], **pycompat.strkwargs(props))
2716 displayer.close()
2717
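A minimal sketch of the generic-template path above, mirroring the ``formatter`` calls this command makes (the template string and properties are invented for illustration)::

    tres = formatter.templateresources(ui)
    t = formatter.maketemplater(ui, b'{greeting}, {name}\n', resources=tres)
    # the props mapping plays the role of the -D KEY=VALUE definitions above
    ui.write(t.renderdefault({b'greeting': b'hello', b'name': b'world'}))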
2718 @command('debuguigetpass', [
2719 ('p', 'prompt', '', _('prompt text'), _('TEXT')),
2720 ], _('[-p TEXT]'), norepo=True)
2721 def debuguigetpass(ui, prompt=''):
2722 """show prompt to type password"""
2723 r = ui.getpass(prompt)
2724 ui.write(('response: %s\n') % r)
2725
2726 @command('debuguiprompt', [
2727 ('p', 'prompt', '', _('prompt text'), _('TEXT')),
2728 ], _('[-p TEXT]'), norepo=True)
2729 def debuguiprompt(ui, prompt=''):
2730 """show plain prompt"""
2731 r = ui.prompt(prompt)
2732 ui.write(('response: %s\n') % r)
2733
2734 @command('debugupdatecaches', [])
2735 def debugupdatecaches(ui, repo, *pats, **opts):
2736 """warm all known caches in the repository"""
2737 with repo.wlock(), repo.lock():
2738 repo.updatecaches(full=True)
2739
2740 @command('debugupgraderepo', [
2741 ('o', 'optimize', [], _('extra optimization to perform'), _('NAME')),
2742 ('', 'run', False, _('performs an upgrade')),
2743 ])
2744 def debugupgraderepo(ui, repo, run=False, optimize=None):
2745 """upgrade a repository to use different features
2746
2747 If no arguments are specified, the repository is evaluated for upgrade
2748 and a list of problems and potential optimizations is printed.
2749
2750 With ``--run``, a repository upgrade is performed. Behavior of the upgrade
2751 can be influenced via additional arguments. More details will be provided
2752 by the command output when run without ``--run``.
2753
2754 During the upgrade, the repository will be locked and no writes will be
2755 allowed.
2756
2757 At the end of the upgrade, the repository may not be readable while new
2758 repository data is swapped in. This window will be as long as it takes to
2759 rename some directories inside the ``.hg`` directory. On most machines, this
2760 should complete almost instantaneously and the chances of a consumer being
2761 unable to access the repository should be low.
2762 """
2763 return upgrade.upgraderepo(ui, repo, run=run, optimize=optimize)
2764
2765 @command('debugwalk', cmdutil.walkopts, _('[OPTION]... [FILE]...'),
2766 inferrepo=True)
2767 def debugwalk(ui, repo, *pats, **opts):
2768 """show how files match on given patterns"""
2769 opts = pycompat.byteskwargs(opts)
2770 m = scmutil.match(repo[None], pats, opts)
2771 if ui.verbose:
2772 ui.write(('* matcher:\n'), stringutil.prettyrepr(m), '\n')
2773 items = list(repo[None].walk(m))
2774 if not items:
2775 return
2776 f = lambda fn: fn
2777 if ui.configbool('ui', 'slash') and pycompat.ossep != '/':
2778 f = lambda fn: util.normpath(fn)
2779 fmt = 'f %%-%ds %%-%ds %%s' % (
2780 max([len(abs) for abs in items]),
2781 max([len(m.rel(abs)) for abs in items]))
2782 for abs in items:
2783 line = fmt % (abs, f(m.rel(abs)), m.exact(abs) and 'exact' or '')
2784 ui.write("%s\n" % line.rstrip())
2785
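A minimal sketch of the matcher/walk pattern used by debugwalk (the pattern is invented; ``repo`` and ``ui`` are assumed to be in hand)::

    m = scmutil.match(repo[None], [b'glob:*.py'], {})  # hypothetical pattern
    for abs in repo[None].walk(m):
        ui.write(b'%s %s\n' % (abs, b'exact' if m.exact(abs) else b''))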
2786 @command('debugwhyunstable', [], _('REV'))
2787 def debugwhyunstable(ui, repo, rev):
2788 """explain instabilities of a changeset"""
2789 for entry in obsutil.whyunstable(repo, scmutil.revsingle(repo, rev)):
2790 dnodes = ''
2791 if entry.get('divergentnodes'):
2792 dnodes = ' '.join('%s (%s)' % (ctx.hex(), ctx.phasestr())
2793 for ctx in entry['divergentnodes']) + ' '
2794 ui.write('%s: %s%s %s\n' % (entry['instability'], dnodes,
2795 entry['reason'], entry['node']))
2796
2797 @command('debugwireargs',
2798 [('', 'three', '', 'three'),
2799 ('', 'four', '', 'four'),
2800 ('', 'five', '', 'five'),
2801 ] + cmdutil.remoteopts,
2802 _('REPO [OPTIONS]... [ONE [TWO]]'),
2803 norepo=True)
2804 def debugwireargs(ui, repopath, *vals, **opts):
2805 opts = pycompat.byteskwargs(opts)
2806 repo = hg.peer(ui, opts, repopath)
2807 for opt in cmdutil.remoteopts:
2808 del opts[opt[1]]
2809 args = {}
2810 for k, v in opts.iteritems():
2811 if v:
2812 args[k] = v
2813 args = pycompat.strkwargs(args)
2814 # run twice to check that we don't mess up the stream for the next command
2815 res1 = repo.debugwireargs(*vals, **args)
2816 res2 = repo.debugwireargs(*vals, **args)
2817 ui.write("%s\n" % res1)
2818 if res1 != res2:
2819 ui.warn("%s\n" % res2)
2820
2821 def _parsewirelangblocks(fh):
2822 activeaction = None
2823 blocklines = []
2824
2825 for line in fh:
2826 line = line.rstrip()
2827 if not line:
2828 continue
2829
2830 if line.startswith(b'#'):
2831 continue
2832
2833 if not line.startswith(b' '):
2834 # New block. Flush previous one.
2835 if activeaction:
2836 yield activeaction, blocklines
2837
2838 activeaction = line
2839 blocklines = []
2840 continue
2841
2842 # Else we start with an indent.
2843
2844 if not activeaction:
2845 raise error.Abort(_('indented line outside of block'))
2846
2847 blocklines.append(line)
2848
2849 # Flush last block.
2850 if activeaction:
2851 yield activeaction, blocklines
2852
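A sketch of what this parser yields for a small input, using io.BytesIO as a stand-in for stdin (the script content is invented; the action names come from the debugwireproto docstring below)::

    import io

    script = io.BytesIO(b'command listkeys\n'
                        b'    namespace bookmarks\n'
                        b'flush\n')
    blocks = list(_parsewirelangblocks(script))
    # blocks == [(b'command listkeys', [b'    namespace bookmarks']),
    #            (b'flush', [])]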
2853 @command('debugwireproto',
2854 [
2855 ('', 'localssh', False, _('start an SSH server for this repo')),
2856 ('', 'peer', '', _('construct a specific version of the peer')),
2857 ('', 'noreadstderr', False, _('do not read from stderr of the remote')),
2858 ('', 'nologhandshake', False,
2859 _('do not log I/O related to the peer handshake')),
2860 ] + cmdutil.remoteopts,
2861 _('[PATH]'),
2862 optionalrepo=True)
2863 def debugwireproto(ui, repo, path=None, **opts):
2864 """send wire protocol commands to a server
2865
2866 This command can be used to issue wire protocol commands to remote
2867 peers and to debug the raw data being exchanged.
2868
2869 ``--localssh`` will start an SSH server against the current repository
2870 and connect to that. By default, the connection will perform a handshake
2871 and establish an appropriate peer instance.
2872
2873 ``--peer`` can be used to bypass the handshake protocol and construct a
2874 peer instance using the specified class type. Valid values are ``raw``,
2875 ``http2``, ``ssh1``, and ``ssh2``. ``raw`` instances only allow sending
2876 raw data payloads and don't support higher-level command actions.
2877
2878 ``--noreadstderr`` can be used to disable automatic reading from stderr
2879 of the peer (for SSH connections only). Disabling automatic reading of
2880 stderr is useful for making output more deterministic.
2881
2882 Commands are issued via a mini language which is specified via stdin.
2883 The language consists of individual actions to perform. An action is
2884 defined by a block. A block is defined as a line with no leading
2885 space followed by 0 or more lines with leading space. Blocks are
2886 effectively a high-level command with additional metadata.
2887
2888 Lines beginning with ``#`` are ignored.
2889
2890 The following sections denote available actions.
2891
2892 raw
2893 ---
2894
2895 Send raw data to the server.
2896
2897 The block payload contains the raw data to send as one atomic send
2898 operation. The data may not actually be delivered in a single system
2899 call: it depends on the abilities of the transport being used.
2900
2901 Each line in the block is de-indented and concatenated. Then, that
2902 value is evaluated as a Python b'' literal. This allows the use of
2903 backslash escaping, etc.
2904
2905 raw+
2906 ----
2907
2908 Behaves like ``raw``, except that it flushes output afterwards.
2909
2910 command <X>
2911 -----------
2912
2913 Send a request to run a named command, whose name follows the ``command``
2914 string.
2915
2916 Arguments to the command are defined as lines in this block. The format of
2917 each line is ``<key> <value>``. e.g.::
2918
2919 command listkeys
2920 namespace bookmarks
2921
2922 If the value begins with ``eval:``, it will be interpreted as a Python
2923 literal expression. Otherwise values are interpreted as Python b'' literals.
2924 This allows sending complex types and encoding special byte sequences via
2925 backslash escaping.
2926
2927 The following arguments have special meaning:
2928
2929 ``PUSHFILE``
2930 When defined, the *push* mechanism of the peer will be used instead
2931 of the static request-response mechanism and the content of the
2932 file specified in the value of this argument will be sent as the
2933 command payload.
2934
2935 This can be used to submit a local bundle file to the remote.
2936
2937 batchbegin
2938 ----------
2939
2940 Instruct the peer to begin a batched send.
2941
2942 All ``command`` blocks are queued for execution until the next
2943 ``batchsubmit`` block.
2944
2945 batchsubmit
2946 -----------
2947
2948 Submit previously queued ``command`` blocks as a batch request.
2949
2950 This action MUST be paired with a ``batchbegin`` action.
2951
2952 httprequest <method> <path>
2953 ---------------------------
2954
2955 (HTTP peer only)
2956
2957 Send an HTTP request to the peer.
2958
2959 The HTTP request line follows the ``httprequest`` action. e.g. ``GET /foo``.
2960
2961 Arguments of the form ``<key>: <value>`` are interpreted as HTTP request
2962 headers to add to the request. e.g. ``Accept: foo``.
2963
2964 The following arguments are special:
2965
2966 ``BODYFILE``
2967 The content of the file defined as the value to this argument will be
2968 transferred verbatim as the HTTP request body.
2969
2970 ``frame <type> <flags> <payload>``
2971 Send a unified protocol frame as part of the request body.
2972
2973 All frames will be collected and sent as the body to the HTTP
2974 request.
2975
2976 close
2977 -----
2978
2979 Close the connection to the server.
2980
2981 flush
2982 -----
2983
2984 Flush data written to the server.
2985
2986 readavailable
2987 -------------
2988
2989 Close the write end of the connection and read all available data from
2990 the server.
2991
2992 If the connection to the server encompasses multiple pipes, we poll both
2993 pipes and read available data.
2994
2995 readline
2996 --------
2997
2998 Read a line of output from the server. If there are multiple output
2999 pipes, reads only the main pipe.
3000
3001 ereadline
3002 ---------
3003
3004 Like ``readline``, but read from the stderr pipe, if available.
3005
3006 read <X>
3007 --------
3008
3009 ``read()`` X bytes from the server's main output pipe.
3010
3011 eread <X>
3012 ---------
3013
3014 ``read()`` X bytes from the server's stderr pipe, if available.
3015
3016 Specifying Unified Frame-Based Protocol Frames
3017 ----------------------------------------------
3018
3019 It is possible to emit *Unified Frame-Based Protocol* frames by using
3020 special syntax.
3021
3022 A frame is composed of a type, flags, and a payload. These can be parsed
3023 from a string of the form:
3024
3025 <request-id> <stream-id> <stream-flags> <type> <flags> <payload>
3026
3027 ``request-id`` and ``stream-id`` are integers defining the request and
3028 stream identifiers.
3029
3030 ``type`` can be an integer value for the frame type or the string name
3031 of the type. The strings are defined in ``wireprotoframing.py``. e.g.
3032 ``command-name``.
3033
3034 ``stream-flags`` and ``flags`` are a ``|`` delimited list of flag
3035 components. Each component (and there can be just one) can be an integer
3036 or a flag name for stream flags or frame flags, respectively. Values are
3037 resolved to integers and then bitwise OR'd together.
3038
3039 ``payload`` represents the raw frame payload. If it begins with
3040 ``cbor:``, the following string is evaluated as Python code and the
3041 resulting object is fed into a CBOR encoder. Otherwise it is interpreted
3042 as a Python byte string literal.
3043 """
3044 opts = pycompat.byteskwargs(opts)
3045
3046 if opts['localssh'] and not repo:
3047 raise error.Abort(_('--localssh requires a repository'))
3048
3049 if opts['peer'] and opts['peer'] not in ('raw', 'http2', 'ssh1', 'ssh2'):
3050 raise error.Abort(_('invalid value for --peer'),
3051 hint=_('valid values are "raw", "http2", "ssh1", and "ssh2"'))
3052
3053 if path and opts['localssh']:
3054 raise error.Abort(_('cannot specify --localssh with an explicit '
3055 'path'))
3056
3057 if ui.interactive():
3058 ui.write(_('(waiting for commands on stdin)\n'))
3059
3060 blocks = list(_parsewirelangblocks(ui.fin))
3061
3062 proc = None
3063 stdin = None
3064 stdout = None
3065 stderr = None
3066 opener = None
3067
3068 if opts['localssh']:
3069 # We start the SSH server in its own process so there is process
3070 # separation. This prevents a whole class of potential bugs around
3071 # shared state from interfering with server operation.
3072 args = procutil.hgcmd() + [
3073 '-R', repo.root,
3074 'debugserve', '--sshstdio',
3075 ]
3076 proc = subprocess.Popen(args, stdin=subprocess.PIPE,
3077 stdout=subprocess.PIPE, stderr=subprocess.PIPE,
3078 bufsize=0)
3079
3080 stdin = proc.stdin
3081 stdout = proc.stdout
3082 stderr = proc.stderr
3083
3084 # We turn the pipes into observers so we can log I/O.
3085 if ui.verbose or opts['peer'] == 'raw':
3086 stdin = util.makeloggingfileobject(ui, proc.stdin, b'i',
3087 logdata=True)
3088 stdout = util.makeloggingfileobject(ui, proc.stdout, b'o',
3089 logdata=True)
3090 stderr = util.makeloggingfileobject(ui, proc.stderr, b'e',
3091 logdata=True)
3092
3093 # --localssh also implies the peer connection settings.
3094
3095 url = 'ssh://localserver'
3096 autoreadstderr = not opts['noreadstderr']
3097
3098 if opts['peer'] == 'ssh1':
3099 ui.write(_('creating ssh peer for wire protocol version 1\n'))
3100 peer = sshpeer.sshv1peer(ui, url, proc, stdin, stdout, stderr,
3101 None, autoreadstderr=autoreadstderr)
3102 elif opts['peer'] == 'ssh2':
3103 ui.write(_('creating ssh peer for wire protocol version 2\n'))
3104 peer = sshpeer.sshv2peer(ui, url, proc, stdin, stdout, stderr,
3105 None, autoreadstderr=autoreadstderr)
3106 elif opts['peer'] == 'raw':
3107 ui.write(_('using raw connection to peer\n'))
3108 peer = None
3109 else:
3110 ui.write(_('creating ssh peer from handshake results\n'))
3111 peer = sshpeer.makepeer(ui, url, proc, stdin, stdout, stderr,
3112 autoreadstderr=autoreadstderr)
3113
3114 elif path:
3115 # We bypass hg.peer() so we can proxy the sockets.
3116 # TODO consider not doing this because we skip
3117 # ``hg.wirepeersetupfuncs`` and potentially other useful functionality.
3118 u = util.url(path)
3119 if u.scheme != 'http':
3120 raise error.Abort(_('only http:// paths are currently supported'))
3121
3122 url, authinfo = u.authinfo()
3123 openerargs = {
3124 r'useragent': b'Mercurial debugwireproto',
3125 }
3126
3127 # Turn pipes/sockets into observers so we can log I/O.
3128 if ui.verbose:
3129 openerargs.update({
3130 r'loggingfh': ui,
3131 r'loggingname': b's',
3132 r'loggingopts': {
3133 r'logdata': True,
3134 r'logdataapis': False,
3135 },
3136 })
3137
3138 if ui.debugflag:
3139 openerargs[r'loggingopts'][r'logdataapis'] = True
3140
3141 # Don't send default headers when in raw mode. This allows us to
3142 # bypass most of the behavior of our URL handling code so we can
3143 # have near complete control over what's sent on the wire.
3144 if opts['peer'] == 'raw':
3145 openerargs[r'sendaccept'] = False
3146
3147 opener = urlmod.opener(ui, authinfo, **openerargs)
3148
3149 if opts['peer'] == 'http2':
3150 ui.write(_('creating http peer for wire protocol version 2\n'))
3151 # We go through makepeer() because we need an API descriptor for
3152 # the peer instance to be useful.
3153 with ui.configoverride({
3154 ('experimental', 'httppeer.advertise-v2'): True}):
3155 if opts['nologhandshake']:
3156 ui.pushbuffer()
3157
3158 peer = httppeer.makepeer(ui, path, opener=opener)
3159
3160 if opts['nologhandshake']:
3161 ui.popbuffer()
3162
3163 if not isinstance(peer, httppeer.httpv2peer):
3164 raise error.Abort(_('could not instantiate HTTP peer for '
3165 'wire protocol version 2'),
3166 hint=_('the server may not have the feature '
3167 'enabled or is not allowing this '
3168 'client version'))
3169
3170 elif opts['peer'] == 'raw':
3171 ui.write(_('using raw connection to peer\n'))
3172 peer = None
3173 elif opts['peer']:
3174 raise error.Abort(_('--peer %s not supported with HTTP peers') %
3175 opts['peer'])
3176 else:
3177 peer = httppeer.makepeer(ui, path, opener=opener)
3178
3179 # We /could/ populate stdin/stdout with sock.makefile()...
3180 else:
3181 raise error.Abort(_('unsupported connection configuration'))
3182
3183 batchedcommands = None
3184
3185 # Now perform actions based on the parsed wire language instructions.
3186 for action, lines in blocks:
3187 if action in ('raw', 'raw+'):
3188 if not stdin:
3189 raise error.Abort(_('cannot call raw/raw+ on this peer'))
3190
3191 # Concatenate the data together.
3192 data = ''.join(l.lstrip() for l in lines)
3193 data = stringutil.unescapestr(data)
3194 stdin.write(data)
3195
3196 if action == 'raw+':
3197 stdin.flush()
3198 elif action == 'flush':
3199 if not stdin:
3200 raise error.Abort(_('cannot call flush on this peer'))
3201 stdin.flush()
3202 elif action.startswith('command'):
3203 if not peer:
3204 raise error.Abort(_('cannot send commands unless peer instance '
3205 'is available'))
3206
3207 command = action.split(' ', 1)[1]
3208
3209 args = {}
3210 for line in lines:
3211 # We need to allow empty values.
3212 fields = line.lstrip().split(' ', 1)
3213 if len(fields) == 1:
3214 key = fields[0]
3215 value = ''
3216 else:
3217 key, value = fields
3218
3219 if value.startswith('eval:'):
3220 value = stringutil.evalpythonliteral(value[5:])
3221 else:
3222 value = stringutil.unescapestr(value)
3223
3224 args[key] = value
3225
3226 if batchedcommands is not None:
3227 batchedcommands.append((command, args))
3228 continue
3229
3230 ui.status(_('sending %s command\n') % command)
3231
3232 if 'PUSHFILE' in args:
3233 with open(args['PUSHFILE'], r'rb') as fh:
3234 del args['PUSHFILE']
3235 res, output = peer._callpush(command, fh,
3236 **pycompat.strkwargs(args))
3237 ui.status(_('result: %s\n') % stringutil.escapestr(res))
3238 ui.status(_('remote output: %s\n') %
3239 stringutil.escapestr(output))
3240 else:
3241 with peer.commandexecutor() as e:
3242 res = e.callcommand(command, args).result()
3243
3244 if isinstance(res, wireprotov2peer.commandresponse):
3245 val = list(res.cborobjects())
3246 ui.status(_('response: %s\n') %
3247 stringutil.pprint(val, bprefix=True))
3248
3249 else:
3250 ui.status(_('response: %s\n') %
3251 stringutil.pprint(res, bprefix=True))
3252
3253 elif action == 'batchbegin':
3254 if batchedcommands is not None:
3255 raise error.Abort(_('nested batchbegin not allowed'))
3256
3257 batchedcommands = []
3258 elif action == 'batchsubmit':
3259 # There is a batching API we could go through. But it would be
3260 # difficult to normalize requests into function calls. It is easier
3261 # to bypass this layer and normalize to commands + args.
3262 ui.status(_('sending batch with %d sub-commands\n') %
3263 len(batchedcommands))
3264 for i, chunk in enumerate(peer._submitbatch(batchedcommands)):
3265 ui.status(_('response #%d: %s\n') %
3266 (i, stringutil.escapestr(chunk)))
3267
3268 batchedcommands = None
3269
3270 elif action.startswith('httprequest '):
3271 if not opener:
3272 raise error.Abort(_('cannot use httprequest without an HTTP '
3273 'peer'))
3274
3275 request = action.split(' ', 2)
3276 if len(request) != 3:
3277 raise error.Abort(_('invalid httprequest: expected format is '
3278 '"httprequest <method> <path>"'))
3279
3280 method, httppath = request[1:]
3281 headers = {}
3282 body = None
3283 frames = []
3284 for line in lines:
3285 line = line.lstrip()
3286 m = re.match(b'^([a-zA-Z0-9_-]+): (.*)$', line)
3287 if m:
3288 headers[m.group(1)] = m.group(2)
3289 continue
3290
3291 if line.startswith(b'BODYFILE '):
3292 with open(line.split(b' ', 1)[1], 'rb') as fh:
3293 body = fh.read()
3294 elif line.startswith(b'frame '):
3295 frame = wireprotoframing.makeframefromhumanstring(
3296 line[len(b'frame '):])
3297
3298 frames.append(frame)
3299 else:
3300 raise error.Abort(_('unknown argument to httprequest: %s') %
3301 line)
3302
3303 url = path + httppath
3304
3305 if frames:
3306 body = b''.join(bytes(f) for f in frames)
3307
3308 req = urlmod.urlreq.request(pycompat.strurl(url), body, headers)
3309
3310 # urllib.Request insists on using has_data() as a proxy for
3311 # determining the request method. Override that to use our
3312 # explicitly requested method.
3313 req.get_method = lambda: pycompat.sysstr(method)
3314
3315 try:
3316 res = opener.open(req)
3317 body = res.read()
3318 except util.urlerr.urlerror as e:
3319 # read() method must be called, but only exists in Python 2
3320 getattr(e, 'read', lambda: None)()
3321 continue
3322
3323 if res.headers.get('Content-Type') == 'application/mercurial-cbor':
3324 ui.write(_('cbor> %s\n') %
3325 stringutil.pprint(cbor.loads(body), bprefix=True))
3326
3327 elif action == 'close':
3328 peer.close()
3329 elif action == 'readavailable':
3330 if not stdout or not stderr:
3331 raise error.Abort(_('readavailable not available on this peer'))
3332
3333 stdin.close()
3334 stdout.read()
3335 stderr.read()
3336
3337 elif action == 'readline':
3338 if not stdout:
3339 raise error.Abort(_('readline not available on this peer'))
3340 stdout.readline()
3341 elif action == 'ereadline':
3342 if not stderr:
3343 raise error.Abort(_('ereadline not available on this peer'))
3344 stderr.readline()
3345 elif action.startswith('read '):
3346 count = int(action.split(' ', 1)[1])
3347 if not stdout:
3348 raise error.Abort(_('read not available on this peer'))
3349 stdout.read(count)
3350 elif action.startswith('eread '):
3351 count = int(action.split(' ', 1)[1])
3352 if not stderr:
3353 raise error.Abort(_('eread not available on this peer'))
3354 stderr.read(count)
3355 else:
3356 raise error.Abort(_('unknown action: %s') % action)
3357
3358 if batchedcommands is not None:
3359 raise error.Abort(_('unclosed "batchbegin" request'))
3360
3361 if peer:
3362 peer.close()
3363
3364 if proc:
3365 proc.kill()
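Putting the actions together, an illustrative stdin script for the mini language documented above (the listkeys namespaces shown are standard Mercurial ones; actual responses depend on the server)::

    # lines starting with '#' are ignored by the parser
    command listkeys
        namespace bookmarks
    batchbegin
    command listkeys
        namespace phases
    command listkeys
        namespace namespaces
    batchsubmit
    close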
@@ -1,3180 +1,2489 @@
1 # revlog.py - storage back-end for mercurial
2 #
3 # Copyright 2005-2007 Matt Mackall <mpm@selenic.com>
4 #
5 # This software may be used and distributed according to the terms of the
6 # GNU General Public License version 2 or any later version.
7
8 """Storage back-end for Mercurial.
9
10 This provides efficient delta storage with O(1) retrieve and append
11 and O(changes) merge between branches.
12 """
13
14 from __future__ import absolute_import
15
16 import collections
17 import contextlib
18 import errno
19 import hashlib
20 import heapq
20 import os
21 import re
22 import struct
23 import zlib
24
25 # import stuff from node for others to import from revlog
26 from .node import (
27 bin,
28 hex,
29 nullhex,
30 nullid,
31 nullrev,
32 wdirfilenodeids,
33 wdirhex,
34 wdirid,
35 wdirrev,
36 )
37 from .i18n import _
38 from .revlogutils.constants import (
39 FLAG_GENERALDELTA,
40 FLAG_INLINE_DATA,
42 LIMIT_DELTA2TEXT,
41 REVIDX_DEFAULT_FLAGS,
42 REVIDX_ELLIPSIS,
43 REVIDX_EXTSTORED,
44 REVIDX_FLAGS_ORDER,
45 REVIDX_ISCENSORED,
46 REVIDX_KNOWN_FLAGS,
47 REVIDX_RAWTEXT_CHANGING_FLAGS,
48 REVLOGV0,
49 REVLOGV1,
50 REVLOGV1_FLAGS,
51 REVLOGV2,
52 REVLOGV2_FLAGS,
53 REVLOG_DEFAULT_FLAGS,
54 REVLOG_DEFAULT_FORMAT,
55 REVLOG_DEFAULT_VERSION,
56 )
57 from .thirdparty import (
58 attr,
59 )
60 from . import (
61 ancestor,
62 error,
63 mdiff,
64 policy,
65 pycompat,
66 repository,
67 templatefilters,
68 util,
69 )
70 from .revlogutils import (
71 deltas as deltautil,
72 )
73 from .utils import (
74 interfaceutil,
75 stringutil,
76 )
77
78 # blanked usage of all the names to prevent pyflakes constraints
79 # We need these names available in the module for extensions.
79 REVLOGV0
80 REVLOGV0
80 REVLOGV1
81 REVLOGV1
81 REVLOGV2
82 REVLOGV2
82 FLAG_INLINE_DATA
83 FLAG_INLINE_DATA
83 FLAG_GENERALDELTA
84 FLAG_GENERALDELTA
84 REVLOG_DEFAULT_FLAGS
85 REVLOG_DEFAULT_FLAGS
85 REVLOG_DEFAULT_FORMAT
86 REVLOG_DEFAULT_FORMAT
86 REVLOG_DEFAULT_VERSION
87 REVLOG_DEFAULT_VERSION
87 REVLOGV1_FLAGS
88 REVLOGV1_FLAGS
88 REVLOGV2_FLAGS
89 REVLOGV2_FLAGS
89 REVIDX_ISCENSORED
90 REVIDX_ISCENSORED
90 REVIDX_ELLIPSIS
91 REVIDX_ELLIPSIS
91 REVIDX_EXTSTORED
92 REVIDX_EXTSTORED
92 REVIDX_DEFAULT_FLAGS
93 REVIDX_DEFAULT_FLAGS
93 REVIDX_FLAGS_ORDER
94 REVIDX_FLAGS_ORDER
94 REVIDX_KNOWN_FLAGS
95 REVIDX_KNOWN_FLAGS
95 REVIDX_RAWTEXT_CHANGING_FLAGS
96 REVIDX_RAWTEXT_CHANGING_FLAGS
96
97
97 parsers = policy.importmod(r'parsers')
98 parsers = policy.importmod(r'parsers')
98
99
99 # Aliased for performance.
100 # Aliased for performance.
100 _zlibdecompress = zlib.decompress
101 _zlibdecompress = zlib.decompress
101
102
102 # max size of revlog with inline data
103 # max size of revlog with inline data
103 _maxinline = 131072
104 _maxinline = 131072
104 _chunksize = 1048576
105 _chunksize = 1048576
105
106
106 RevlogError = error.RevlogError
107 RevlogError = error.RevlogError
107 LookupError = error.LookupError
108 LookupError = error.LookupError
108 AmbiguousPrefixLookupError = error.AmbiguousPrefixLookupError
109 AmbiguousPrefixLookupError = error.AmbiguousPrefixLookupError
109 CensoredNodeError = error.CensoredNodeError
110 CensoredNodeError = error.CensoredNodeError
110 ProgrammingError = error.ProgrammingError
111 ProgrammingError = error.ProgrammingError
111
112
112 # Store flag processors (cf. 'addflagprocessor()' to register)
113 # Store flag processors (cf. 'addflagprocessor()' to register)
113 _flagprocessors = {
114 _flagprocessors = {
114 REVIDX_ISCENSORED: None,
115 REVIDX_ISCENSORED: None,
115 }
116 }
116
117
117 _mdre = re.compile('\1\n')
118 _mdre = re.compile('\1\n')
118 def parsemeta(text):
119 def parsemeta(text):
119 """return (metadatadict, metadatasize)"""
120 """return (metadatadict, metadatasize)"""
120 # text can be buffer, so we can't use .startswith or .index
121 # text can be buffer, so we can't use .startswith or .index
121 if text[:2] != '\1\n':
122 if text[:2] != '\1\n':
122 return None, None
123 return None, None
123 s = _mdre.search(text, 2).start()
124 s = _mdre.search(text, 2).start()
124 mtext = text[2:s]
125 mtext = text[2:s]
125 meta = {}
126 meta = {}
126 for l in mtext.splitlines():
127 for l in mtext.splitlines():
127 k, v = l.split(": ", 1)
128 k, v = l.split(": ", 1)
128 meta[k] = v
129 meta[k] = v
129 return meta, (s + 2)
130 return meta, (s + 2)
130
131
131 def packmeta(meta, text):
132 def packmeta(meta, text):
132 keys = sorted(meta)
133 keys = sorted(meta)
133 metatext = "".join("%s: %s\n" % (k, meta[k]) for k in keys)
134 metatext = "".join("%s: %s\n" % (k, meta[k]) for k in keys)
134 return "\1\n%s\1\n%s" % (metatext, text)
135 return "\1\n%s\1\n%s" % (metatext, text)
135
136
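As an illustration, the metadata format above round-trips as follows. This is a sketch: the keys mimic Mercurial's copy metadata but are invented for this example, and real callers pass bytestrings.

    meta = {'copy': 'a.txt', 'copyrev': '0' * 40}  # illustrative keys
    packed = packmeta(meta, 'file contents\n')
    # packed == '\1\ncopy: a.txt\ncopyrev: 000...000\n\1\nfile contents\n'
    parsed, size = parsemeta(packed)
    assert parsed == meta
    assert packed[size:] == 'file contents\n'  # size points past the metadata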
136 def _censoredtext(text):
137 def _censoredtext(text):
137 m, offs = parsemeta(text)
138 m, offs = parsemeta(text)
138 return m and "censored" in m
139 return m and "censored" in m
139
140
140 def addflagprocessor(flag, processor):
141 def addflagprocessor(flag, processor):
141 """Register a flag processor on a revision data flag.
142 """Register a flag processor on a revision data flag.
142
143
143 Invariant:
144 Invariant:
144 - Flags need to be defined in REVIDX_KNOWN_FLAGS and REVIDX_FLAGS_ORDER,
145 - Flags need to be defined in REVIDX_KNOWN_FLAGS and REVIDX_FLAGS_ORDER,
145 and REVIDX_RAWTEXT_CHANGING_FLAGS if they can alter rawtext.
146 and REVIDX_RAWTEXT_CHANGING_FLAGS if they can alter rawtext.
146 - Only one flag processor can be registered on a specific flag.
147 - Only one flag processor can be registered on a specific flag.
147 - flagprocessors must be 3-tuples of functions (read, write, raw) with the
148 - flagprocessors must be 3-tuples of functions (read, write, raw) with the
148 following signatures:
149 following signatures:
149 - (read) f(self, rawtext) -> text, bool
150 - (read) f(self, rawtext) -> text, bool
150 - (write) f(self, text) -> rawtext, bool
151 - (write) f(self, text) -> rawtext, bool
151 - (raw) f(self, rawtext) -> bool
152 - (raw) f(self, rawtext) -> bool
152 "text" is presented to the user. "rawtext" is stored in revlog data, not
153 "text" is presented to the user. "rawtext" is stored in revlog data, not
153 directly visible to the user.
154 directly visible to the user.
154 The boolean returned by these transforms is used to determine whether
155 The boolean returned by these transforms is used to determine whether
155 the returned text can be used for hash integrity checking. For example,
156 the returned text can be used for hash integrity checking. For example,
156 if "write" returns False, then "text" is used to generate hash. If
157 if "write" returns False, then "text" is used to generate hash. If
157 "write" returns True, that basically means "rawtext" returned by "write"
158 "write" returns True, that basically means "rawtext" returned by "write"
158 should be used to generate hash. Usually, "write" and "read" return
159 should be used to generate hash. Usually, "write" and "read" return
159 different booleans. And "raw" returns the same boolean as "write".
160 different booleans. And "raw" returns the same boolean as "write".
160
161
161 Note: The 'raw' transform is used for changegroup generation and in some
162 Note: The 'raw' transform is used for changegroup generation and in some
162 debug commands. In this case the transform only indicates whether the
163 debug commands. In this case the transform only indicates whether the
163 contents can be used for hash integrity checks.
164 contents can be used for hash integrity checks.
164 """
165 """
165 if not flag & REVIDX_KNOWN_FLAGS:
166 if not flag & REVIDX_KNOWN_FLAGS:
166 msg = _("cannot register processor on unknown flag '%#x'.") % (flag)
167 msg = _("cannot register processor on unknown flag '%#x'.") % (flag)
167 raise ProgrammingError(msg)
168 raise ProgrammingError(msg)
168 if flag not in REVIDX_FLAGS_ORDER:
169 if flag not in REVIDX_FLAGS_ORDER:
169 msg = _("flag '%#x' undefined in REVIDX_FLAGS_ORDER.") % (flag)
170 msg = _("flag '%#x' undefined in REVIDX_FLAGS_ORDER.") % (flag)
170 raise ProgrammingError(msg)
171 raise ProgrammingError(msg)
171 if flag in _flagprocessors:
172 if flag in _flagprocessors:
172 msg = _("cannot register multiple processors on flag '%#x'.") % (flag)
173 msg = _("cannot register multiple processors on flag '%#x'.") % (flag)
173 raise error.Abort(msg)
174 raise error.Abort(msg)
174 _flagprocessors[flag] = processor
175 _flagprocessors[flag] = processor
175
176
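As a hedged sketch of the registration API above: the transforms below are hypothetical, invented purely for illustration, and a real processor must use a flag actually defined in REVIDX_FLAGS_ORDER (REVIDX_EXTSTORED merely stands in for one here).

    def _examplereadtransform(self, rawtext):
        return rawtext, True      # text shown to the user; True: hashable

    def _examplewritetransform(self, text):
        return text, True         # rawtext to store; True: hash the rawtext

    def _examplerawtransform(self, rawtext):
        return True               # rawtext is usable for hash checks

    # hypothetical registration, left commented out:
    # addflagprocessor(REVIDX_EXTSTORED,
    #                  (_examplereadtransform,
    #                   _examplewritetransform,
    #                   _examplerawtransform))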
176 def getoffset(q):
177 def getoffset(q):
177 return int(q >> 16)
178 return int(q >> 16)
178
179
179 def gettype(q):
180 def gettype(q):
180 return int(q & 0xFFFF)
181 return int(q & 0xFFFF)
181
182
182 def offset_type(offset, type):
183 def offset_type(offset, type):
183 if (type & ~REVIDX_KNOWN_FLAGS) != 0:
184 if (type & ~REVIDX_KNOWN_FLAGS) != 0:
184 raise ValueError('unknown revlog index flags')
185 raise ValueError('unknown revlog index flags')
185 return int(int(offset) << 16 | type)
186 return int(int(offset) << 16 | type)
186
187
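The packing above round-trips as expected. For example, using the module-level helpers just defined (REVIDX_ISCENSORED stands in for any known flag):

    packed = offset_type(4096, REVIDX_ISCENSORED)
    assert getoffset(packed) == 4096
    assert gettype(packed) == REVIDX_ISCENSORED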
187 _nullhash = hashlib.sha1(nullid)
188 _nullhash = hashlib.sha1(nullid)
188
189
189 def hash(text, p1, p2):
190 def hash(text, p1, p2):
190 """generate a hash from the given text and its parent hashes
191 """generate a hash from the given text and its parent hashes
191
192
192 This hash combines both the current file contents and its history
193 This hash combines both the current file contents and its history
193 in a manner that makes it easy to distinguish nodes with the same
194 in a manner that makes it easy to distinguish nodes with the same
194 content in the revision graph.
195 content in the revision graph.
195 """
196 """
196 # As of now, if one of the parent nodes is null, p2 is null
197 # As of now, if one of the parent nodes is null, p2 is null
197 if p2 == nullid:
198 if p2 == nullid:
198 # deep copy of a hash is faster than creating one
199 # deep copy of a hash is faster than creating one
199 s = _nullhash.copy()
200 s = _nullhash.copy()
200 s.update(p1)
201 s.update(p1)
201 else:
202 else:
202 # none of the parent nodes are nullid
203 # none of the parent nodes are nullid
203 if p1 < p2:
204 if p1 < p2:
204 a = p1
205 a = p1
205 b = p2
206 b = p2
206 else:
207 else:
207 a = p2
208 a = p2
208 b = p1
209 b = p1
209 s = hashlib.sha1(a)
210 s = hashlib.sha1(a)
210 s.update(b)
211 s.update(b)
211 s.update(text)
212 s.update(text)
212 return s.digest()
213 return s.digest()
213
214
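Equivalently, since the parents are hashed in sorted order in both branches (nullid sorts below any real node), the nodeid computation can be written in one step. A standalone sketch with made-up values:

    import hashlib

    p1 = b'\x11' * 20                  # made-up parent nodeids
    p2 = b'\x22' * 20
    text = b'file contents\n'

    lo, hi = sorted([p1, p2])          # parents hashed in sorted order
    node = hashlib.sha1(lo + hi + text).digest()
    assert node == hash(text, p1, p2)  # the hash() defined above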
214 class _testrevlog(object):
215 """minimalist fake revlog to use in doctests"""
216
217 def __init__(self, data, density=0.5, mingap=0):
218 """data is an list of revision payload boundaries"""
219 self._data = data
220 self._srdensitythreshold = density
221 self._srmingapsize = mingap
222
223 def start(self, rev):
224 if rev == 0:
225 return 0
226 return self._data[rev - 1]
227
228 def end(self, rev):
229 return self._data[rev]
230
231 def length(self, rev):
232 return self.end(rev) - self.start(rev)
233
234 def __len__(self):
235 return len(self._data)
236
237 def _trimchunk(revlog, revs, startidx, endidx=None):
238 """returns revs[startidx:endidx] without empty trailing revs
239
240 Doctest Setup
241 >>> revlog = _testrevlog([
242 ... 5, #0
243 ... 10, #1
244 ... 12, #2
245 ... 12, #3 (empty)
246 ... 17, #4
247 ... 21, #5
248 ... 21, #6 (empty)
249 ... ])
250
251 Contiguous cases:
252 >>> _trimchunk(revlog, [0, 1, 2, 3, 4, 5, 6], 0)
253 [0, 1, 2, 3, 4, 5]
254 >>> _trimchunk(revlog, [0, 1, 2, 3, 4, 5, 6], 0, 5)
255 [0, 1, 2, 3, 4]
256 >>> _trimchunk(revlog, [0, 1, 2, 3, 4, 5, 6], 0, 4)
257 [0, 1, 2]
258 >>> _trimchunk(revlog, [0, 1, 2, 3, 4, 5, 6], 2, 4)
259 [2]
260 >>> _trimchunk(revlog, [0, 1, 2, 3, 4, 5, 6], 3)
261 [3, 4, 5]
262 >>> _trimchunk(revlog, [0, 1, 2, 3, 4, 5, 6], 3, 5)
263 [3, 4]
264
265 Discontiguous cases:
266 >>> _trimchunk(revlog, [1, 3, 5, 6], 0)
267 [1, 3, 5]
268 >>> _trimchunk(revlog, [1, 3, 5, 6], 0, 2)
269 [1]
270 >>> _trimchunk(revlog, [1, 3, 5, 6], 1, 3)
271 [3, 5]
272 >>> _trimchunk(revlog, [1, 3, 5, 6], 1)
273 [3, 5]
274 """
275 length = revlog.length
276
277 if endidx is None:
278 endidx = len(revs)
279
280 # If we have a non-empty delta candidate, there is nothing to trim
281 if revs[endidx - 1] < len(revlog):
282 # Trim empty revs at the end, except the very first revision of a chain
283 while (endidx > 1
284 and endidx > startidx
285 and length(revs[endidx - 1]) == 0):
286 endidx -= 1
287
288 return revs[startidx:endidx]
289
290 def _segmentspan(revlog, revs, deltainfo=None):
291 """Get the byte span of a segment of revisions
292
293 revs is a sorted array of revision numbers
294
295 >>> revlog = _testrevlog([
296 ... 5, #0
297 ... 10, #1
298 ... 12, #2
299 ... 12, #3 (empty)
300 ... 17, #4
301 ... ])
302
303 >>> _segmentspan(revlog, [0, 1, 2, 3, 4])
304 17
305 >>> _segmentspan(revlog, [0, 4])
306 17
307 >>> _segmentspan(revlog, [3, 4])
308 5
309 >>> _segmentspan(revlog, [1, 2, 3,])
310 7
311 >>> _segmentspan(revlog, [1, 3])
312 7
313 """
314 if not revs:
315 return 0
316 if deltainfo is not None and len(revlog) <= revs[-1]:
317 if len(revs) == 1:
318 return deltainfo.deltalen
319 offset = revlog.end(len(revlog) - 1)
320 end = deltainfo.deltalen + offset
321 else:
322 end = revlog.end(revs[-1])
323 return end - revlog.start(revs[0])
324
325 def _slicechunk(revlog, revs, deltainfo=None, targetsize=None):
326 """slice revs to reduce the amount of unrelated data to be read from disk.
327
328 ``revs`` is sliced into groups that should be read in one go.
329 Assume that revs are sorted.
330
331 The initial chunk is sliced until the overall density (payload/chunks-span
332 ratio) is above `revlog._srdensitythreshold`. No gap smaller than
333 `revlog._srmingapsize` is skipped.
334
335 If `targetsize` is set, no chunk larger than `targetsize` will be yielded.
336 For consistency with other slicing choices, this limit won't go lower than
337 `revlog._srmingapsize`.
338
339 If individual revision chunks are larger than this limit, they will still
340 be yielded individually.
341
342 >>> revlog = _testrevlog([
343 ... 5, #00 (5)
344 ... 10, #01 (5)
345 ... 12, #02 (2)
346 ... 12, #03 (empty)
347 ... 27, #04 (15)
348 ... 31, #05 (4)
349 ... 31, #06 (empty)
350 ... 42, #07 (11)
351 ... 47, #08 (5)
352 ... 47, #09 (empty)
353 ... 48, #10 (1)
354 ... 51, #11 (3)
355 ... 74, #12 (23)
356 ... 85, #13 (11)
357 ... 86, #14 (1)
358 ... 91, #15 (5)
359 ... ])
360
361 >>> list(_slicechunk(revlog, list(range(16))))
362 [[0, 1, 2, 3, 4, 5, 6, 7, 8, 9, 10, 11, 12, 13, 14, 15]]
363 >>> list(_slicechunk(revlog, [0, 15]))
364 [[0], [15]]
365 >>> list(_slicechunk(revlog, [0, 11, 15]))
366 [[0], [11], [15]]
367 >>> list(_slicechunk(revlog, [0, 11, 13, 15]))
368 [[0], [11, 13, 15]]
369 >>> list(_slicechunk(revlog, [1, 2, 3, 5, 8, 10, 11, 14]))
370 [[1, 2], [5, 8, 10, 11], [14]]
371
372 Slicing with a maximum chunk size
373 >>> list(_slicechunk(revlog, [0, 11, 13, 15], targetsize=15))
374 [[0], [11], [13], [15]]
375 >>> list(_slicechunk(revlog, [0, 11, 13, 15], targetsize=20))
376 [[0], [11], [13, 15]]
377 """
378 if targetsize is not None:
379 targetsize = max(targetsize, revlog._srmingapsize)
380 # targetsize should not be specified when evaluating delta candidates:
381 # * targetsize is used to ensure we stay within specification when reading,
382 # * deltainfo is used to pick a good delta chain when writing.
383 if not (deltainfo is None or targetsize is None):
384 msg = 'cannot use `targetsize` with a `deltainfo`'
385 raise error.ProgrammingError(msg)
386 for chunk in _slicechunktodensity(revlog, revs,
387 deltainfo,
388 revlog._srdensitythreshold,
389 revlog._srmingapsize):
390 for subchunk in _slicechunktosize(revlog, chunk, targetsize):
391 yield subchunk
392
393 def _slicechunktosize(revlog, revs, targetsize=None):
394 """slice revs to match the target size
395
396 This is intended to be used on chunks that density slicing selected but that
397 are still too large compared to the read guarantee of revlog. This might
398 happen when the "minimal gap size" interrupted the slicing or when chains are
399 built in a way that creates large blocks next to each other.
400
401 >>> revlog = _testrevlog([
402 ... 3, #0 (3)
403 ... 5, #1 (2)
404 ... 6, #2 (1)
405 ... 8, #3 (2)
406 ... 8, #4 (empty)
407 ... 11, #5 (3)
408 ... 12, #6 (1)
409 ... 13, #7 (1)
410 ... 14, #8 (1)
411 ... ])
412
413 Cases where chunk is already small enough
414 >>> list(_slicechunktosize(revlog, [0], 3))
415 [[0]]
416 >>> list(_slicechunktosize(revlog, [6, 7], 3))
417 [[6, 7]]
418 >>> list(_slicechunktosize(revlog, [0], None))
419 [[0]]
420 >>> list(_slicechunktosize(revlog, [6, 7], None))
421 [[6, 7]]
422
423 Cases where we need actual slicing
424 >>> list(_slicechunktosize(revlog, [0, 1], 3))
425 [[0], [1]]
426 >>> list(_slicechunktosize(revlog, [1, 3], 3))
427 [[1], [3]]
428 >>> list(_slicechunktosize(revlog, [1, 2, 3], 3))
429 [[1, 2], [3]]
430 >>> list(_slicechunktosize(revlog, [3, 5], 3))
431 [[3], [5]]
432 >>> list(_slicechunktosize(revlog, [3, 4, 5], 3))
433 [[3], [5]]
434 >>> list(_slicechunktosize(revlog, [5, 6, 7, 8], 3))
435 [[5], [6, 7, 8]]
436 >>> list(_slicechunktosize(revlog, [0, 1, 2, 3, 4, 5, 6, 7, 8], 3))
437 [[0], [1, 2], [3], [5], [6, 7, 8]]
438
439 Case with too large individual chunk (must return valid chunk)
440 >>> list(_slicechunktosize(revlog, [0, 1], 2))
441 [[0], [1]]
442 >>> list(_slicechunktosize(revlog, [1, 3], 1))
443 [[1], [3]]
444 >>> list(_slicechunktosize(revlog, [3, 4, 5], 2))
445 [[3], [5]]
446 """
447 assert targetsize is None or 0 <= targetsize
448 if targetsize is None or _segmentspan(revlog, revs) <= targetsize:
449 yield revs
450 return
451
452 startrevidx = 0
453 startdata = revlog.start(revs[0])
454 endrevidx = 0
455 iterrevs = enumerate(revs)
456 next(iterrevs) # skip first rev.
457 for idx, r in iterrevs:
458 span = revlog.end(r) - startdata
459 if span <= targetsize:
460 endrevidx = idx
461 else:
462 chunk = _trimchunk(revlog, revs, startrevidx, endrevidx + 1)
463 if chunk:
464 yield chunk
465 startrevidx = idx
466 startdata = revlog.start(r)
467 endrevidx = idx
468 yield _trimchunk(revlog, revs, startrevidx)
469
470 def _slicechunktodensity(revlog, revs, deltainfo=None, targetdensity=0.5,
471 mingapsize=0):
472 """slice revs to reduce the amount of unrelated data to be read from disk.
473
474 ``revs`` is sliced into groups that should be read in one go.
475 Assume that revs are sorted.
476
477 ``deltainfo`` is a _deltainfo instance of a revision that we would append
478 to the top of the revlog.
479
480 The initial chunk is sliced until the overall density (payload/chunks-span
481 ratio) is above `targetdensity`. No gap smaller than `mingapsize` is
482 skipped.
483
484 >>> revlog = _testrevlog([
485 ... 5, #00 (5)
486 ... 10, #01 (5)
487 ... 12, #02 (2)
488 ... 12, #03 (empty)
489 ... 27, #04 (15)
490 ... 31, #05 (4)
491 ... 31, #06 (empty)
492 ... 42, #07 (11)
493 ... 47, #08 (5)
494 ... 47, #09 (empty)
495 ... 48, #10 (1)
496 ... 51, #11 (3)
497 ... 74, #12 (23)
498 ... 85, #13 (11)
499 ... 86, #14 (1)
500 ... 91, #15 (5)
501 ... ])
502
503 >>> list(_slicechunktodensity(revlog, list(range(16))))
504 [[0, 1, 2, 3, 4, 5, 6, 7, 8, 9, 10, 11, 12, 13, 14, 15]]
505 >>> list(_slicechunktodensity(revlog, [0, 15]))
506 [[0], [15]]
507 >>> list(_slicechunktodensity(revlog, [0, 11, 15]))
508 [[0], [11], [15]]
509 >>> list(_slicechunktodensity(revlog, [0, 11, 13, 15]))
510 [[0], [11, 13, 15]]
511 >>> list(_slicechunktodensity(revlog, [1, 2, 3, 5, 8, 10, 11, 14]))
512 [[1, 2], [5, 8, 10, 11], [14]]
513 >>> list(_slicechunktodensity(revlog, [1, 2, 3, 5, 8, 10, 11, 14],
514 ... mingapsize=20))
515 [[1, 2, 3, 5, 8, 10, 11], [14]]
516 >>> list(_slicechunktodensity(revlog, [1, 2, 3, 5, 8, 10, 11, 14],
517 ... targetdensity=0.95))
518 [[1, 2], [5], [8, 10, 11], [14]]
519 >>> list(_slicechunktodensity(revlog, [1, 2, 3, 5, 8, 10, 11, 14],
520 ... targetdensity=0.95, mingapsize=12))
521 [[1, 2], [5, 8, 10, 11], [14]]
522 """
523 start = revlog.start
524 length = revlog.length
525
526 if len(revs) <= 1:
527 yield revs
528 return
529
530 nextrev = len(revlog)
531 nextoffset = revlog.end(nextrev - 1)
532
533 if deltainfo is None:
534 deltachainspan = _segmentspan(revlog, revs)
535 chainpayload = sum(length(r) for r in revs)
536 else:
537 deltachainspan = deltainfo.distance
538 chainpayload = deltainfo.compresseddeltalen
539
540 if deltachainspan < mingapsize:
541 yield revs
542 return
543
544 readdata = deltachainspan
545
546 if deltachainspan:
547 density = chainpayload / float(deltachainspan)
548 else:
549 density = 1.0
550
551 if density >= targetdensity:
552 yield revs
553 return
554
555 if deltainfo is not None and deltainfo.deltalen:
556 revs = list(revs)
557 revs.append(nextrev)
558
559 # Store the gaps in a heap to have them sorted by decreasing size
560 gapsheap = []
561 heapq.heapify(gapsheap)
562 prevend = None
563 for i, rev in enumerate(revs):
564 if rev < nextrev:
565 revstart = start(rev)
566 revlen = length(rev)
567 else:
568 revstart = nextoffset
569 revlen = deltainfo.deltalen
570
571 # Skip empty revisions to form larger holes
572 if revlen == 0:
573 continue
574
575 if prevend is not None:
576 gapsize = revstart - prevend
577 # only consider holes that are large enough
578 if gapsize > mingapsize:
579 heapq.heappush(gapsheap, (-gapsize, i))
580
581 prevend = revstart + revlen
582
583 # Collect the indices of the largest holes until the density is acceptable
584 indicesheap = []
585 heapq.heapify(indicesheap)
586 while gapsheap and density < targetdensity:
587 oppgapsize, gapidx = heapq.heappop(gapsheap)
588
589 heapq.heappush(indicesheap, gapidx)
590
591 # the gap sizes are stored as negatives to be sorted decreasingly
592 # by the heap
593 readdata -= (-oppgapsize)
594 if readdata > 0:
595 density = chainpayload / float(readdata)
596 else:
597 density = 1.0
598
599 # Cut the revs at collected indices
600 previdx = 0
601 while indicesheap:
602 idx = heapq.heappop(indicesheap)
603
604 chunk = _trimchunk(revlog, revs, previdx, idx)
605 if chunk:
606 yield chunk
607
608 previdx = idx
609
610 chunk = _trimchunk(revlog, revs, previdx)
611 if chunk:
612 yield chunk
613
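The heap trick used above deserves a note: Python's heapq is a min-heap, so gap sizes are pushed negated in order to pop the largest gap first. A self-contained sketch with made-up gap data:

    import heapq

    gaps = [(10, 1), (42, 3), (7, 5)]            # (gapsize, index), made up
    gapsheap = [(-size, idx) for size, idx in gaps]
    heapq.heapify(gapsheap)

    negsize, idx = heapq.heappop(gapsheap)       # largest gap comes out first
    assert (-negsize, idx) == (42, 3)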
614 @attr.s(slots=True, frozen=True)
615 class _deltainfo(object):
616 distance = attr.ib()
617 deltalen = attr.ib()
618 data = attr.ib()
619 base = attr.ib()
620 chainbase = attr.ib()
621 chainlen = attr.ib()
622 compresseddeltalen = attr.ib()
623 snapshotdepth = attr.ib()
624
625 class _deltacomputer(object):
626 def __init__(self, revlog):
627 self.revlog = revlog
628
629 def _getcandidaterevs(self, p1, p2, cachedelta):
630 """
631 Provides candidate revisions that are worth diffing against,
632 grouped by level of easiness.
633 """
634 revlog = self.revlog
635 gdelta = revlog._generaldelta
636 curr = len(revlog)
637 prev = curr - 1
638 p1r, p2r = revlog.rev(p1), revlog.rev(p2)
639
640 # should we try to build a delta?
641 if prev != nullrev and revlog._storedeltachains:
642 tested = set()
643 # This condition is true most of the time when processing
644 # changegroup data into a generaldelta repo. The only time it
645 # isn't true is if this is the first revision in a delta chain
646 # or if ``format.generaldelta=true`` disabled ``lazydeltabase``.
647 if cachedelta and gdelta and revlog._lazydeltabase:
648 # Assume what we received from the server is a good choice
649 # building the delta will reuse the cache
650 yield (cachedelta[0],)
651 tested.add(cachedelta[0])
652
653 if gdelta:
654 # exclude the base already tested via lazydeltabase, if any
655 parents = [p for p in (p1r, p2r)
656 if p != nullrev and p not in tested]
657
658 if not revlog._deltabothparents and len(parents) == 2:
659 parents.sort()
660 # To minimize the chance of having to build a fulltext,
661 # pick first whichever parent is closest to us (max rev)
662 yield (parents[1],)
663 # then the other one (min rev) if the first did not fit
664 yield (parents[0],)
665 tested.update(parents)
666 elif len(parents) > 0:
667 # Test all parents (1 or 2), and keep the best candidate
668 yield parents
669 tested.update(parents)
670
671 if prev not in tested:
672 # other approaches failed; try against prev to hopefully save us a
673 # fulltext.
674 yield (prev,)
675 tested.add(prev)
676
677 def buildtext(self, revinfo, fh):
678 """Builds a fulltext version of a revision
679
680 revinfo: _revisioninfo instance that contains all needed info
681 fh: file handle to either the .i or the .d revlog file,
682 depending on whether it is inlined or not
683 """
684 btext = revinfo.btext
685 if btext[0] is not None:
686 return btext[0]
687
688 revlog = self.revlog
689 cachedelta = revinfo.cachedelta
690 flags = revinfo.flags
691 node = revinfo.node
692
693 baserev = cachedelta[0]
694 delta = cachedelta[1]
695 # special case deltas which replace entire base; no need to decode
696 # base revision. this neatly avoids censored bases, which throw when
697 # they're decoded.
698 hlen = struct.calcsize(">lll")
699 if delta[:hlen] == mdiff.replacediffheader(revlog.rawsize(baserev),
700 len(delta) - hlen):
701 btext[0] = delta[hlen:]
702 else:
703 # deltabase is the rawtext before it was changed by flag processors,
704 # which is equivalent to non-raw text
705 basetext = revlog.revision(baserev, _df=fh, raw=False)
706 btext[0] = mdiff.patch(basetext, delta)
707
708 try:
709 res = revlog._processflags(btext[0], flags, 'read', raw=True)
710 btext[0], validatehash = res
711 if validatehash:
712 revlog.checkhash(btext[0], node, p1=revinfo.p1, p2=revinfo.p2)
713 if flags & REVIDX_ISCENSORED:
714 raise RevlogError(_('node %s is not censored') % node)
715 except CensoredNodeError:
716 # must pass the censored index flag to add censored revisions
717 if not flags & REVIDX_ISCENSORED:
718 raise
719 return btext[0]
720
721 def _builddeltadiff(self, base, revinfo, fh):
722 revlog = self.revlog
723 t = self.buildtext(revinfo, fh)
724 if revlog.iscensored(base):
725 # deltas based on a censored revision must replace the
726 # full content in one patch, so delta works everywhere
727 header = mdiff.replacediffheader(revlog.rawsize(base), len(t))
728 delta = header + t
729 else:
730 ptext = revlog.revision(base, _df=fh, raw=True)
731 delta = mdiff.textdiff(ptext, t)
732
733 return delta
734
735 def _builddeltainfo(self, revinfo, base, fh):
736 # can we use the cached delta?
737 if revinfo.cachedelta and revinfo.cachedelta[0] == base:
738 delta = revinfo.cachedelta[1]
739 else:
740 delta = self._builddeltadiff(base, revinfo, fh)
741 revlog = self.revlog
742 header, data = revlog.compress(delta)
743 deltalen = len(header) + len(data)
744 chainbase = revlog.chainbase(base)
745 offset = revlog.end(len(revlog) - 1)
746 dist = deltalen + offset - revlog.start(chainbase)
747 if revlog._generaldelta:
748 deltabase = base
749 else:
750 deltabase = chainbase
751 chainlen, compresseddeltalen = revlog._chaininfo(base)
752 chainlen += 1
753 compresseddeltalen += deltalen
754
755 revlog = self.revlog
756 snapshotdepth = None
757 if deltabase == nullrev:
758 snapshotdepth = 0
759 elif revlog._sparserevlog and revlog.issnapshot(deltabase):
760 # A delta chain should always be one full snapshot,
761 # zero or more semi-snapshots, and zero or more deltas
762 p1, p2 = revlog.rev(revinfo.p1), revlog.rev(revinfo.p2)
763 if deltabase not in (p1, p2) and revlog.issnapshot(deltabase):
764 snapshotdepth = len(revlog._deltachain(deltabase)[0])
765
766 return _deltainfo(dist, deltalen, (header, data), deltabase,
767 chainbase, chainlen, compresseddeltalen,
768 snapshotdepth)
769
770 def finddeltainfo(self, revinfo, fh):
771 """Find an acceptable delta against a candidate revision
772
773 revinfo: information about the revision (instance of _revisioninfo)
774 fh: file handle to either the .i or the .d revlog file,
775 depending on whether it is inlined or not
776
777 Returns the first acceptable candidate revision, as ordered by
778 _getcandidaterevs
779 """
780 if not revinfo.textlen:
781 return None # empty files do not need a delta
782
783 cachedelta = revinfo.cachedelta
784 p1 = revinfo.p1
785 p2 = revinfo.p2
786 revlog = self.revlog
787
788 deltalength = self.revlog.length
789 deltaparent = self.revlog.deltaparent
790
791 deltainfo = None
792 deltas_limit = revinfo.textlen * LIMIT_DELTA2TEXT
793 for candidaterevs in self._getcandidaterevs(p1, p2, cachedelta):
794 # filter out delta bases that will never produce a good delta
795 candidaterevs = [r for r in candidaterevs
796 if self.revlog.length(r) <= deltas_limit]
797 nominateddeltas = []
798 for candidaterev in candidaterevs:
799 # skip over empty deltas (no need to include them in a chain)
800 while candidaterev != nullrev and not deltalength(candidaterev):
801 candidaterev = deltaparent(candidaterev)
802 # no need to try a delta against nullid, this will be handled
803 # by fulltext later.
804 if candidaterev == nullrev:
805 continue
806 # no delta for rawtext-changing revs (see "candelta" for why)
807 if revlog.flags(candidaterev) & REVIDX_RAWTEXT_CHANGING_FLAGS:
808 continue
809 candidatedelta = self._builddeltainfo(revinfo, candidaterev, fh)
810 if revlog._isgooddeltainfo(candidatedelta, revinfo):
811 nominateddeltas.append(candidatedelta)
812 if nominateddeltas:
813 deltainfo = min(nominateddeltas, key=lambda x: x.deltalen)
814 break
815
816 return deltainfo
817
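Putting the removed pieces together, a caller would drive the delta computer roughly as below. This is a schematic sketch: `rl`, `revinfo`, and `fh` are assumed to already exist, matching the parameter names above.

    dc = _deltacomputer(rl)                    # rl: a revlog instance
    deltainfo = dc.finddeltainfo(revinfo, fh)
    if deltainfo is None:
        pass   # no acceptable delta; the revision is stored as a fulltext
    else:
        header, data = deltainfo.data          # compressed delta to append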
818 @attr.s(slots=True, frozen=True)
215 @attr.s(slots=True, frozen=True)
819 class _revisioninfo(object):
216 class _revisioninfo(object):
820 """Information about a revision that allows building its fulltext
217 """Information about a revision that allows building its fulltext
821 node: expected hash of the revision
218 node: expected hash of the revision
822 p1, p2: parent revs of the revision
219 p1, p2: parent revs of the revision
823 btext: built text cache consisting of a one-element list
220 btext: built text cache consisting of a one-element list
824 cachedelta: (baserev, uncompressed_delta) or None
221 cachedelta: (baserev, uncompressed_delta) or None
825 flags: flags associated to the revision storage
222 flags: flags associated to the revision storage
826
223
827 One of btext[0] or cachedelta must be set.
224 One of btext[0] or cachedelta must be set.
828 """
225 """
829 node = attr.ib()
226 node = attr.ib()
830 p1 = attr.ib()
227 p1 = attr.ib()
831 p2 = attr.ib()
228 p2 = attr.ib()
832 btext = attr.ib()
229 btext = attr.ib()
833 textlen = attr.ib()
230 textlen = attr.ib()
834 cachedelta = attr.ib()
231 cachedelta = attr.ib()
835 flags = attr.ib()
232 flags = attr.ib()
836
233
837 @interfaceutil.implementer(repository.irevisiondelta)
234 @interfaceutil.implementer(repository.irevisiondelta)
838 @attr.s(slots=True, frozen=True)
235 @attr.s(slots=True, frozen=True)
839 class revlogrevisiondelta(object):
236 class revlogrevisiondelta(object):
840 node = attr.ib()
237 node = attr.ib()
841 p1node = attr.ib()
238 p1node = attr.ib()
842 p2node = attr.ib()
239 p2node = attr.ib()
843 basenode = attr.ib()
240 basenode = attr.ib()
844 linknode = attr.ib()
241 linknode = attr.ib()
845 flags = attr.ib()
242 flags = attr.ib()
846 baserevisionsize = attr.ib()
243 baserevisionsize = attr.ib()
847 revision = attr.ib()
244 revision = attr.ib()
848 delta = attr.ib()
245 delta = attr.ib()
849
246
850 # index v0:
247 # index v0:
851 # 4 bytes: offset
248 # 4 bytes: offset
852 # 4 bytes: compressed length
249 # 4 bytes: compressed length
853 # 4 bytes: base rev
250 # 4 bytes: base rev
854 # 4 bytes: link rev
251 # 4 bytes: link rev
855 # 20 bytes: parent 1 nodeid
252 # 20 bytes: parent 1 nodeid
856 # 20 bytes: parent 2 nodeid
253 # 20 bytes: parent 2 nodeid
857 # 20 bytes: nodeid
254 # 20 bytes: nodeid
858 indexformatv0 = struct.Struct(">4l20s20s20s")
255 indexformatv0 = struct.Struct(">4l20s20s20s")
859 indexformatv0_pack = indexformatv0.pack
256 indexformatv0_pack = indexformatv0.pack
860 indexformatv0_unpack = indexformatv0.unpack
257 indexformatv0_unpack = indexformatv0.unpack
861
258
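For reference, a v0 index entry is 76 bytes and round-trips through the struct above like this (all field values are invented):

    import struct

    fmt = struct.Struct(">4l20s20s20s")   # same layout as indexformatv0
    assert fmt.size == 76                 # 4 ints + 3 20-byte nodeids

    entry = fmt.pack(
        0,               # offset into the data file
        42,              # compressed length
        0,               # base rev of the delta chain
        7,               # link rev
        b'\x11' * 20,    # parent 1 nodeid
        b'\x00' * 20,    # parent 2 nodeid (null)
        b'\x22' * 20,    # this revision's nodeid
    )
    offset, length, base, linkrev, p1, p2, node = fmt.unpack(entry)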
862 class revlogoldindex(list):
259 class revlogoldindex(list):
863 def __getitem__(self, i):
260 def __getitem__(self, i):
864 if i == -1:
261 if i == -1:
865 return (0, 0, 0, -1, -1, -1, -1, nullid)
262 return (0, 0, 0, -1, -1, -1, -1, nullid)
866 return list.__getitem__(self, i)
263 return list.__getitem__(self, i)
867
264
868 class revlogoldio(object):
265 class revlogoldio(object):
869 def __init__(self):
266 def __init__(self):
870 self.size = indexformatv0.size
267 self.size = indexformatv0.size
871
268
872 def parseindex(self, data, inline):
269 def parseindex(self, data, inline):
873 s = self.size
270 s = self.size
874 index = []
271 index = []
875 nodemap = {nullid: nullrev}
272 nodemap = {nullid: nullrev}
876 n = off = 0
273 n = off = 0
877 l = len(data)
274 l = len(data)
878 while off + s <= l:
275 while off + s <= l:
879 cur = data[off:off + s]
276 cur = data[off:off + s]
880 off += s
277 off += s
881 e = indexformatv0_unpack(cur)
278 e = indexformatv0_unpack(cur)
882 # transform to revlogv1 format
279 # transform to revlogv1 format
883 e2 = (offset_type(e[0], 0), e[1], -1, e[2], e[3],
280 e2 = (offset_type(e[0], 0), e[1], -1, e[2], e[3],
884 nodemap.get(e[4], nullrev), nodemap.get(e[5], nullrev), e[6])
281 nodemap.get(e[4], nullrev), nodemap.get(e[5], nullrev), e[6])
885 index.append(e2)
282 index.append(e2)
886 nodemap[e[6]] = n
283 nodemap[e[6]] = n
887 n += 1
284 n += 1
888
285
889 return revlogoldindex(index), nodemap, None
286 return revlogoldindex(index), nodemap, None
890
287
891 def packentry(self, entry, node, version, rev):
288 def packentry(self, entry, node, version, rev):
892 if gettype(entry[0]):
289 if gettype(entry[0]):
893 raise RevlogError(_('index entry flags need revlog version 1'))
290 raise RevlogError(_('index entry flags need revlog version 1'))
894 e2 = (getoffset(entry[0]), entry[1], entry[3], entry[4],
291 e2 = (getoffset(entry[0]), entry[1], entry[3], entry[4],
895 node(entry[5]), node(entry[6]), entry[7])
292 node(entry[5]), node(entry[6]), entry[7])
896 return indexformatv0_pack(*e2)
293 return indexformatv0_pack(*e2)
897
294
898 # index ng:
295 # index ng:
899 # 6 bytes: offset
296 # 6 bytes: offset
900 # 2 bytes: flags
297 # 2 bytes: flags
901 # 4 bytes: compressed length
298 # 4 bytes: compressed length
902 # 4 bytes: uncompressed length
299 # 4 bytes: uncompressed length
903 # 4 bytes: base rev
300 # 4 bytes: base rev
904 # 4 bytes: link rev
301 # 4 bytes: link rev
905 # 4 bytes: parent 1 rev
302 # 4 bytes: parent 1 rev
906 # 4 bytes: parent 2 rev
303 # 4 bytes: parent 2 rev
907 # 32 bytes: nodeid
304 # 32 bytes: nodeid
908 indexformatng = struct.Struct(">Qiiiiii20s12x")
305 indexformatng = struct.Struct(">Qiiiiii20s12x")
909 indexformatng_pack = indexformatng.pack
306 indexformatng_pack = indexformatng.pack
910 versionformat = struct.Struct(">I")
307 versionformat = struct.Struct(">I")
911 versionformat_pack = versionformat.pack
308 versionformat_pack = versionformat.pack
912 versionformat_unpack = versionformat.unpack
309 versionformat_unpack = versionformat.unpack
913
310
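The "ng" entry is 64 bytes; its leading uint64 packs the 6-byte offset and 2-byte flags exactly as offset_type() does above, and for rev 0 packentry() below overwrites the first 4 bytes with the version header. A standalone sketch with invented values:

    import struct

    fmt = struct.Struct(">Qiiiiii20s12x")   # same layout as indexformatng
    assert fmt.size == 64

    first = (4096 << 16) | 0                # offset 4096, no flags
    entry = fmt.pack(first, 30, 120, 0, 5, 4, -1, b'\x33' * 20)
    fields = fmt.unpack(entry)
    assert fields[0] >> 16 == 4096          # cf. getoffset()
    assert fields[0] & 0xFFFF == 0          # cf. gettype()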
914 # corresponds to uncompressed length of indexformatng (2 gigs, 4-byte
311 # corresponds to uncompressed length of indexformatng (2 gigs, 4-byte
915 # signed integer)
312 # signed integer)
916 _maxentrysize = 0x7fffffff
313 _maxentrysize = 0x7fffffff
917
314
918 class revlogio(object):
315 class revlogio(object):
919 def __init__(self):
316 def __init__(self):
920 self.size = indexformatng.size
317 self.size = indexformatng.size
921
318
922 def parseindex(self, data, inline):
319 def parseindex(self, data, inline):
923 # call the C implementation to parse the index data
320 # call the C implementation to parse the index data
924 index, cache = parsers.parse_index2(data, inline)
321 index, cache = parsers.parse_index2(data, inline)
925 return index, getattr(index, 'nodemap', None), cache
322 return index, getattr(index, 'nodemap', None), cache
926
323
927 def packentry(self, entry, node, version, rev):
324 def packentry(self, entry, node, version, rev):
928 p = indexformatng_pack(*entry)
325 p = indexformatng_pack(*entry)
929 if rev == 0:
326 if rev == 0:
930 p = versionformat_pack(version) + p[4:]
327 p = versionformat_pack(version) + p[4:]
931 return p
328 return p
932
329
933 class revlog(object):
330 class revlog(object):
934 """
331 """
935 the underlying revision storage object
332 the underlying revision storage object
936
333
937 A revlog consists of two parts, an index and the revision data.
334 A revlog consists of two parts, an index and the revision data.
938
335
939 The index is a file with a fixed record size containing
336 The index is a file with a fixed record size containing
940 information on each revision, including its nodeid (hash), the
337 information on each revision, including its nodeid (hash), the
941 nodeids of its parents, the position and offset of its data within
338 nodeids of its parents, the position and offset of its data within
942 the data file, and the revision it's based on. Finally, each entry
339 the data file, and the revision it's based on. Finally, each entry
943 contains a linkrev entry that can serve as a pointer to external
340 contains a linkrev entry that can serve as a pointer to external
944 data.
341 data.
945
342
946 The revision data itself is a linear collection of data chunks.
343 The revision data itself is a linear collection of data chunks.
947 Each chunk represents a revision and is usually represented as a
344 Each chunk represents a revision and is usually represented as a
948 delta against the previous chunk. To bound lookup time, runs of
345 delta against the previous chunk. To bound lookup time, runs of
949 deltas are limited to about 2 times the length of the original
346 deltas are limited to about 2 times the length of the original
950 version data. This makes retrieval of a version proportional to
347 version data. This makes retrieval of a version proportional to
951 its size, or O(1) relative to the number of revisions.
348 its size, or O(1) relative to the number of revisions.
952
349
953 Both pieces of the revlog are written to in an append-only
350 Both pieces of the revlog are written to in an append-only
954 fashion, which means we never need to rewrite a file to insert or
351 fashion, which means we never need to rewrite a file to insert or
955 remove data, and can use some simple techniques to avoid the need
352 remove data, and can use some simple techniques to avoid the need
956 for locking while reading.
353 for locking while reading.
957
354
958 If checkambig, indexfile is opened with checkambig=True at
355 If checkambig, indexfile is opened with checkambig=True at
959 writing, to avoid file stat ambiguity.
356 writing, to avoid file stat ambiguity.
960
357
961 If mmaplargeindex is True, and an mmapindexthreshold is set, the
358 If mmaplargeindex is True, and an mmapindexthreshold is set, the
962 index will be mmapped rather than read if it is larger than the
359 index will be mmapped rather than read if it is larger than the
963 configured threshold.
360 configured threshold.
964
361
965 If censorable is True, the revlog can have censored revisions.
362 If censorable is True, the revlog can have censored revisions.
966 """
363 """
967 def __init__(self, opener, indexfile, datafile=None, checkambig=False,
364 def __init__(self, opener, indexfile, datafile=None, checkambig=False,
968 mmaplargeindex=False, censorable=False):
365 mmaplargeindex=False, censorable=False):
969 """
366 """
970 create a revlog object
367 create a revlog object
971
368
972 opener is a function that abstracts the file opening operation
369 opener is a function that abstracts the file opening operation
973 and can be used to implement COW semantics or the like.
370 and can be used to implement COW semantics or the like.
974 """
371 """
975 self.indexfile = indexfile
372 self.indexfile = indexfile
976 self.datafile = datafile or (indexfile[:-2] + ".d")
373 self.datafile = datafile or (indexfile[:-2] + ".d")
977 self.opener = opener
374 self.opener = opener
978 # When True, indexfile is opened with checkambig=True at writing, to
375 # When True, indexfile is opened with checkambig=True at writing, to
979 # avoid file stat ambiguity.
376 # avoid file stat ambiguity.
980 self._checkambig = checkambig
377 self._checkambig = checkambig
981 self._censorable = censorable
378 self._censorable = censorable
982 # 3-tuple of (node, rev, text) for a raw revision.
379 # 3-tuple of (node, rev, text) for a raw revision.
983 self._cache = None
380 self._cache = None
984 # Maps rev to chain base rev.
381 # Maps rev to chain base rev.
985 self._chainbasecache = util.lrucachedict(100)
382 self._chainbasecache = util.lrucachedict(100)
986 # 2-tuple of (offset, data) of raw data from the revlog at an offset.
383 # 2-tuple of (offset, data) of raw data from the revlog at an offset.
987 self._chunkcache = (0, '')
384 self._chunkcache = (0, '')
988 # How much data to read and cache into the raw revlog data cache.
385 # How much data to read and cache into the raw revlog data cache.
989 self._chunkcachesize = 65536
386 self._chunkcachesize = 65536
990 self._maxchainlen = None
387 self._maxchainlen = None
991 self._deltabothparents = True
388 self._deltabothparents = True
992 self.index = []
389 self.index = []
993 # Mapping of partial identifiers to full nodes.
390 # Mapping of partial identifiers to full nodes.
994 self._pcache = {}
391 self._pcache = {}
995 # Mapping of revision integer to full node.
392 # Mapping of revision integer to full node.
996 self._nodecache = {nullid: nullrev}
393 self._nodecache = {nullid: nullrev}
997 self._nodepos = None
394 self._nodepos = None
998 self._compengine = 'zlib'
395 self._compengine = 'zlib'
999 self._maxdeltachainspan = -1
396 self._maxdeltachainspan = -1
1000 self._withsparseread = False
397 self._withsparseread = False
1001 self._sparserevlog = False
398 self._sparserevlog = False
1002 self._srdensitythreshold = 0.50
399 self._srdensitythreshold = 0.50
1003 self._srmingapsize = 262144
400 self._srmingapsize = 262144
1004
401
1005 mmapindexthreshold = None
402 mmapindexthreshold = None
1006 v = REVLOG_DEFAULT_VERSION
403 v = REVLOG_DEFAULT_VERSION
1007 opts = getattr(opener, 'options', None)
404 opts = getattr(opener, 'options', None)
1008 if opts is not None:
405 if opts is not None:
1009 if 'revlogv2' in opts:
406 if 'revlogv2' in opts:
1010 # version 2 revlogs always use generaldelta.
407 # version 2 revlogs always use generaldelta.
1011 v = REVLOGV2 | FLAG_GENERALDELTA | FLAG_INLINE_DATA
408 v = REVLOGV2 | FLAG_GENERALDELTA | FLAG_INLINE_DATA
1012 elif 'revlogv1' in opts:
409 elif 'revlogv1' in opts:
1013 if 'generaldelta' in opts:
410 if 'generaldelta' in opts:
1014 v |= FLAG_GENERALDELTA
411 v |= FLAG_GENERALDELTA
1015 else:
412 else:
1016 v = 0
413 v = 0
1017 if 'chunkcachesize' in opts:
414 if 'chunkcachesize' in opts:
1018 self._chunkcachesize = opts['chunkcachesize']
415 self._chunkcachesize = opts['chunkcachesize']
1019 if 'maxchainlen' in opts:
416 if 'maxchainlen' in opts:
1020 self._maxchainlen = opts['maxchainlen']
417 self._maxchainlen = opts['maxchainlen']
1021 if 'deltabothparents' in opts:
418 if 'deltabothparents' in opts:
1022 self._deltabothparents = opts['deltabothparents']
419 self._deltabothparents = opts['deltabothparents']
1023 self._lazydeltabase = bool(opts.get('lazydeltabase', False))
420 self._lazydeltabase = bool(opts.get('lazydeltabase', False))
1024 if 'compengine' in opts:
421 if 'compengine' in opts:
1025 self._compengine = opts['compengine']
422 self._compengine = opts['compengine']
1026 if 'maxdeltachainspan' in opts:
423 if 'maxdeltachainspan' in opts:
1027 self._maxdeltachainspan = opts['maxdeltachainspan']
424 self._maxdeltachainspan = opts['maxdeltachainspan']
1028 if mmaplargeindex and 'mmapindexthreshold' in opts:
425 if mmaplargeindex and 'mmapindexthreshold' in opts:
1029 mmapindexthreshold = opts['mmapindexthreshold']
426 mmapindexthreshold = opts['mmapindexthreshold']
1030 self._sparserevlog = bool(opts.get('sparse-revlog', False))
427 self._sparserevlog = bool(opts.get('sparse-revlog', False))
1031 withsparseread = bool(opts.get('with-sparse-read', False))
428 withsparseread = bool(opts.get('with-sparse-read', False))
1032 # sparse-revlog forces sparse-read
429 # sparse-revlog forces sparse-read
1033 self._withsparseread = self._sparserevlog or withsparseread
430 self._withsparseread = self._sparserevlog or withsparseread
1034 if 'sparse-read-density-threshold' in opts:
431 if 'sparse-read-density-threshold' in opts:
1035 self._srdensitythreshold = opts['sparse-read-density-threshold']
432 self._srdensitythreshold = opts['sparse-read-density-threshold']
1036 if 'sparse-read-min-gap-size' in opts:
433 if 'sparse-read-min-gap-size' in opts:
1037 self._srmingapsize = opts['sparse-read-min-gap-size']
434 self._srmingapsize = opts['sparse-read-min-gap-size']
1038
435
1039 if self._chunkcachesize <= 0:
436 if self._chunkcachesize <= 0:
1040 raise RevlogError(_('revlog chunk cache size %r is not greater '
437 raise RevlogError(_('revlog chunk cache size %r is not greater '
1041 'than 0') % self._chunkcachesize)
438 'than 0') % self._chunkcachesize)
1042 elif self._chunkcachesize & (self._chunkcachesize - 1):
439 elif self._chunkcachesize & (self._chunkcachesize - 1):
1043 raise RevlogError(_('revlog chunk cache size %r is not a power '
440 raise RevlogError(_('revlog chunk cache size %r is not a power '
1044 'of 2') % self._chunkcachesize)
441 'of 2') % self._chunkcachesize)
1045
442
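The power-of-two test above relies on the classic bit trick: x & (x - 1) clears the lowest set bit, so it is zero exactly for powers of two (zero itself is rejected by the preceding check):

    for x in (1, 2, 4, 65536):
        assert x & (x - 1) == 0     # power of two: accepted
    for x in (3, 6, 65535):
        assert x & (x - 1) != 0     # not a power of two: rejected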
1046 indexdata = ''
443 indexdata = ''
1047 self._initempty = True
444 self._initempty = True
1048 try:
445 try:
1049 with self._indexfp() as f:
446 with self._indexfp() as f:
1050 if (mmapindexthreshold is not None and
447 if (mmapindexthreshold is not None and
1051 self.opener.fstat(f).st_size >= mmapindexthreshold):
448 self.opener.fstat(f).st_size >= mmapindexthreshold):
1052 indexdata = util.buffer(util.mmapread(f))
449 indexdata = util.buffer(util.mmapread(f))
1053 else:
450 else:
1054 indexdata = f.read()
451 indexdata = f.read()
1055 if len(indexdata) > 0:
452 if len(indexdata) > 0:
1056 v = versionformat_unpack(indexdata[:4])[0]
453 v = versionformat_unpack(indexdata[:4])[0]
1057 self._initempty = False
454 self._initempty = False
1058 except IOError as inst:
455 except IOError as inst:
1059 if inst.errno != errno.ENOENT:
456 if inst.errno != errno.ENOENT:
1060 raise
457 raise
1061
458
1062 self.version = v
459 self.version = v
1063 self._inline = v & FLAG_INLINE_DATA
460 self._inline = v & FLAG_INLINE_DATA
1064 self._generaldelta = v & FLAG_GENERALDELTA
461 self._generaldelta = v & FLAG_GENERALDELTA
1065 flags = v & ~0xFFFF
462 flags = v & ~0xFFFF
1066 fmt = v & 0xFFFF
463 fmt = v & 0xFFFF
1067 if fmt == REVLOGV0:
464 if fmt == REVLOGV0:
1068 if flags:
465 if flags:
1069 raise RevlogError(_('unknown flags (%#04x) in version %d '
466 raise RevlogError(_('unknown flags (%#04x) in version %d '
1070 'revlog %s') %
467 'revlog %s') %
1071 (flags >> 16, fmt, self.indexfile))
468 (flags >> 16, fmt, self.indexfile))
1072 elif fmt == REVLOGV1:
469 elif fmt == REVLOGV1:
1073 if flags & ~REVLOGV1_FLAGS:
470 if flags & ~REVLOGV1_FLAGS:
1074 raise RevlogError(_('unknown flags (%#04x) in version %d '
471 raise RevlogError(_('unknown flags (%#04x) in version %d '
1075 'revlog %s') %
472 'revlog %s') %
1076 (flags >> 16, fmt, self.indexfile))
473 (flags >> 16, fmt, self.indexfile))
1077 elif fmt == REVLOGV2:
474 elif fmt == REVLOGV2:
1078 if flags & ~REVLOGV2_FLAGS:
475 if flags & ~REVLOGV2_FLAGS:
1079 raise RevlogError(_('unknown flags (%#04x) in version %d '
476 raise RevlogError(_('unknown flags (%#04x) in version %d '
1080 'revlog %s') %
477 'revlog %s') %
1081 (flags >> 16, fmt, self.indexfile))
478 (flags >> 16, fmt, self.indexfile))
1082 else:
479 else:
1083 raise RevlogError(_('unknown version (%d) in revlog %s') %
480 raise RevlogError(_('unknown version (%d) in revlog %s') %
1084 (fmt, self.indexfile))
481 (fmt, self.indexfile))
1085
482
1086 self._storedeltachains = True
483 self._storedeltachains = True
1087
484
1088 self._io = revlogio()
485 self._io = revlogio()
1089 if self.version == REVLOGV0:
486 if self.version == REVLOGV0:
1090 self._io = revlogoldio()
487 self._io = revlogoldio()
1091 try:
488 try:
1092 d = self._io.parseindex(indexdata, self._inline)
489 d = self._io.parseindex(indexdata, self._inline)
1093 except (ValueError, IndexError):
490 except (ValueError, IndexError):
1094 raise RevlogError(_("index %s is corrupted") % (self.indexfile))
491 raise RevlogError(_("index %s is corrupted") % (self.indexfile))
1095 self.index, nodemap, self._chunkcache = d
492 self.index, nodemap, self._chunkcache = d
1096 if nodemap is not None:
493 if nodemap is not None:
1097 self.nodemap = self._nodecache = nodemap
494 self.nodemap = self._nodecache = nodemap
1098 if not self._chunkcache:
495 if not self._chunkcache:
1099 self._chunkclear()
496 self._chunkclear()
1100 # revnum -> (chain-length, sum-delta-length)
497 # revnum -> (chain-length, sum-delta-length)
1101 self._chaininfocache = {}
498 self._chaininfocache = {}
1102 # revlog header -> revlog compressor
499 # revlog header -> revlog compressor
1103 self._decompressors = {}
500 self._decompressors = {}
1104
501
1105 @util.propertycache
502 @util.propertycache
1106 def _compressor(self):
503 def _compressor(self):
1107 return util.compengines[self._compengine].revlogcompressor()
504 return util.compengines[self._compengine].revlogcompressor()
1108
505
1109 def _indexfp(self, mode='r'):
506 def _indexfp(self, mode='r'):
1110 """file object for the revlog's index file"""
507 """file object for the revlog's index file"""
1111 args = {r'mode': mode}
508 args = {r'mode': mode}
1112 if mode != 'r':
509 if mode != 'r':
1113 args[r'checkambig'] = self._checkambig
510 args[r'checkambig'] = self._checkambig
1114 if mode == 'w':
511 if mode == 'w':
1115 args[r'atomictemp'] = True
512 args[r'atomictemp'] = True
1116 return self.opener(self.indexfile, **args)
513 return self.opener(self.indexfile, **args)
1117
514
1118 def _datafp(self, mode='r'):
515 def _datafp(self, mode='r'):
1119 """file object for the revlog's data file"""
516 """file object for the revlog's data file"""
1120 return self.opener(self.datafile, mode=mode)
517 return self.opener(self.datafile, mode=mode)
1121
518
1122 @contextlib.contextmanager
519 @contextlib.contextmanager
1123 def _datareadfp(self, existingfp=None):
520 def _datareadfp(self, existingfp=None):
1124 """file object suitable to read data"""
521 """file object suitable to read data"""
1125 if existingfp is not None:
522 if existingfp is not None:
1126 yield existingfp
523 yield existingfp
1127 else:
524 else:
1128 if self._inline:
525 if self._inline:
1129 func = self._indexfp
526 func = self._indexfp
1130 else:
527 else:
1131 func = self._datafp
528 func = self._datafp
1132 with func() as fp:
529 with func() as fp:
1133 yield fp
530 yield fp
1134
531
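A minimal sketch of how the context manager above is used, assuming a non-inline revlog (so offsets map directly to the data file) and an existing revlog instance rl; start() and length() are defined further down:

    with rl._datareadfp() as fp:     # picks the .i or .d file as appropriate
        fp.seek(rl.start(0))
        chunk = fp.read(rl.length(0))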
1135 def tip(self):
532 def tip(self):
1136 return self.node(len(self.index) - 1)
533 return self.node(len(self.index) - 1)
1137 def __contains__(self, rev):
534 def __contains__(self, rev):
1138 return 0 <= rev < len(self)
535 return 0 <= rev < len(self)
1139 def __len__(self):
536 def __len__(self):
1140 return len(self.index)
537 return len(self.index)
1141 def __iter__(self):
538 def __iter__(self):
1142 return iter(pycompat.xrange(len(self)))
539 return iter(pycompat.xrange(len(self)))
1143 def revs(self, start=0, stop=None):
540 def revs(self, start=0, stop=None):
1144 """iterate over all rev in this revlog (from start to stop)"""
541 """iterate over all rev in this revlog (from start to stop)"""
1145 step = 1
542 step = 1
1146 length = len(self)
543 length = len(self)
1147 if stop is not None:
544 if stop is not None:
1148 if start > stop:
545 if start > stop:
1149 step = -1
546 step = -1
1150 stop += step
547 stop += step
1151 if stop > length:
548 if stop > length:
1152 stop = length
549 stop = length
1153 else:
550 else:
1154 stop = length
551 stop = length
1155 return pycompat.xrange(start, stop, step)
552 return pycompat.xrange(start, stop, step)
1156
553
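Given the stepping logic above, the stop revision is inclusive in both directions. For example, with an assumed existing revlog rl holding at least four revisions:

    assert list(rl.revs(start=3, stop=1)) == [3, 2, 1]   # descending
    assert list(rl.revs(start=0, stop=2)) == [0, 1, 2]   # ascending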
1157 @util.propertycache
554 @util.propertycache
1158 def nodemap(self):
555 def nodemap(self):
1159 if self.index:
556 if self.index:
1160 # populate mapping down to the initial node
557 # populate mapping down to the initial node
1161 node0 = self.index[0][7] # get around changelog filtering
558 node0 = self.index[0][7] # get around changelog filtering
1162 self.rev(node0)
559 self.rev(node0)
1163 return self._nodecache
560 return self._nodecache
1164
561
1165 def hasnode(self, node):
562 def hasnode(self, node):
1166 try:
563 try:
1167 self.rev(node)
564 self.rev(node)
1168 return True
565 return True
1169 except KeyError:
566 except KeyError:
1170 return False
567 return False
1171
568
1172 def candelta(self, baserev, rev):
569 def candelta(self, baserev, rev):
1173 """whether two revisions (baserev, rev) can be delta-ed or not"""
570 """whether two revisions (baserev, rev) can be delta-ed or not"""
1174 # Disable delta if either rev requires a content-changing flag
571 # Disable delta if either rev requires a content-changing flag
1175 # processor (ex. LFS). This is because such a flag processor can alter
572 # processor (ex. LFS). This is because such a flag processor can alter
1176 # the rawtext content that the delta will be based on, and two clients
573 # the rawtext content that the delta will be based on, and two clients
1177 # could have the same revlog node with different flags (i.e. different
574 # could have the same revlog node with different flags (i.e. different
1178 # rawtext contents) and the delta could be incompatible.
575 # rawtext contents) and the delta could be incompatible.
1179 if ((self.flags(baserev) & REVIDX_RAWTEXT_CHANGING_FLAGS)
576 if ((self.flags(baserev) & REVIDX_RAWTEXT_CHANGING_FLAGS)
1180 or (self.flags(rev) & REVIDX_RAWTEXT_CHANGING_FLAGS)):
577 or (self.flags(rev) & REVIDX_RAWTEXT_CHANGING_FLAGS)):
1181 return False
578 return False
1182 return True
579 return True
1183
580
1184 def clearcaches(self):
581 def clearcaches(self):
1185 self._cache = None
582 self._cache = None
1186 self._chainbasecache.clear()
583 self._chainbasecache.clear()
1187 self._chunkcache = (0, '')
584 self._chunkcache = (0, '')
1188 self._pcache = {}
585 self._pcache = {}
1189
586
1190 try:
587 try:
1191 self._nodecache.clearcaches()
588 self._nodecache.clearcaches()
1192 except AttributeError:
589 except AttributeError:
1193 self._nodecache = {nullid: nullrev}
590 self._nodecache = {nullid: nullrev}
1194 self._nodepos = None
591 self._nodepos = None
1195
592
1196 def rev(self, node):
593 def rev(self, node):
1197 try:
594 try:
1198 return self._nodecache[node]
595 return self._nodecache[node]
1199 except TypeError:
596 except TypeError:
1200 raise
597 raise
1201 except RevlogError:
598 except RevlogError:
1202 # parsers.c radix tree lookup failed
599 # parsers.c radix tree lookup failed
1203 if node == wdirid or node in wdirfilenodeids:
600 if node == wdirid or node in wdirfilenodeids:
1204 raise error.WdirUnsupported
601 raise error.WdirUnsupported
1205 raise LookupError(node, self.indexfile, _('no node'))
602 raise LookupError(node, self.indexfile, _('no node'))
1206 except KeyError:
603 except KeyError:
1207 # pure python cache lookup failed
604 # pure python cache lookup failed
1208 n = self._nodecache
605 n = self._nodecache
1209 i = self.index
606 i = self.index
1210 p = self._nodepos
607 p = self._nodepos
1211 if p is None:
608 if p is None:
1212 p = len(i) - 1
609 p = len(i) - 1
1213 else:
610 else:
1214 assert p < len(i)
611 assert p < len(i)
1215 for r in pycompat.xrange(p, -1, -1):
612 for r in pycompat.xrange(p, -1, -1):
1216 v = i[r][7]
613 v = i[r][7]
1217 n[v] = r
614 n[v] = r
1218 if v == node:
615 if v == node:
1219 self._nodepos = r - 1
616 self._nodepos = r - 1
1220 return r
617 return r
1221 if node == wdirid or node in wdirfilenodeids:
618 if node == wdirid or node in wdirfilenodeids:
1222 raise error.WdirUnsupported
619 raise error.WdirUnsupported
1223 raise LookupError(node, self.indexfile, _('no node'))
620 raise LookupError(node, self.indexfile, _('no node'))
1224
621
1225 # Accessors for index entries.
622 # Accessors for index entries.
1226
623
1227 # First tuple entry is 8 bytes. First 6 bytes are offset. Last 2 bytes
624 # First tuple entry is 8 bytes. First 6 bytes are offset. Last 2 bytes
1228 # are flags.
625 # are flags.
1229 def start(self, rev):
626 def start(self, rev):
1230 return int(self.index[rev][0] >> 16)
627 return int(self.index[rev][0] >> 16)
1231
628
1232 def flags(self, rev):
629 def flags(self, rev):
1233 return self.index[rev][0] & 0xFFFF
630 return self.index[rev][0] & 0xFFFF
1234
631
1235 def length(self, rev):
632 def length(self, rev):
1236 return self.index[rev][1]
633 return self.index[rev][1]
1237
634
1238 def rawsize(self, rev):
635 def rawsize(self, rev):
1239 """return the length of the uncompressed text for a given revision"""
636 """return the length of the uncompressed text for a given revision"""
1240 l = self.index[rev][2]
637 l = self.index[rev][2]
1241 if l >= 0:
638 if l >= 0:
1242 return l
639 return l
1243
640
1244 t = self.revision(rev, raw=True)
641 t = self.revision(rev, raw=True)
1245 return len(t)
642 return len(t)
1246
643
1247 def size(self, rev):
644 def size(self, rev):
1248 """length of non-raw text (processed by a "read" flag processor)"""
645 """length of non-raw text (processed by a "read" flag processor)"""
1249 # fast path: if no "read" flag processor could change the content,
646 # fast path: if no "read" flag processor could change the content,
1250 # size is rawsize. note: ELLIPSIS is known to not change the content.
647 # size is rawsize. note: ELLIPSIS is known to not change the content.
1251 flags = self.flags(rev)
648 flags = self.flags(rev)
1252 if flags & (REVIDX_KNOWN_FLAGS ^ REVIDX_ELLIPSIS) == 0:
649 if flags & (REVIDX_KNOWN_FLAGS ^ REVIDX_ELLIPSIS) == 0:
1253 return self.rawsize(rev)
650 return self.rawsize(rev)
1254
651
1255 return len(self.revision(rev, raw=False))
652 return len(self.revision(rev, raw=False))

    def chainbase(self, rev):
        base = self._chainbasecache.get(rev)
        if base is not None:
            return base

        index = self.index
        iterrev = rev
        base = index[iterrev][3]
        while base != iterrev:
            iterrev = base
            base = index[iterrev][3]

        self._chainbasecache[rev] = base
        return base

    def linkrev(self, rev):
        return self.index[rev][4]

    def parentrevs(self, rev):
        try:
            entry = self.index[rev]
        except IndexError:
            if rev == wdirrev:
                raise error.WdirUnsupported
            raise

        return entry[5], entry[6]

    def node(self, rev):
        try:
            return self.index[rev][7]
        except IndexError:
            if rev == wdirrev:
                raise error.WdirUnsupported
            raise

    # Derived from index values.

    def end(self, rev):
        return self.start(rev) + self.length(rev)

    def parents(self, node):
        i = self.index
        d = i[self.rev(node)]
        return i[d[5]][7], i[d[6]][7] # map revisions to nodes inline

    def chainlen(self, rev):
        return self._chaininfo(rev)[0]

    def _chaininfo(self, rev):
        chaininfocache = self._chaininfocache
        if rev in chaininfocache:
            return chaininfocache[rev]
        index = self.index
        generaldelta = self._generaldelta
        iterrev = rev
        e = index[iterrev]
        clen = 0
        compresseddeltalen = 0
        while iterrev != e[3]:
            clen += 1
            compresseddeltalen += e[1]
            if generaldelta:
                iterrev = e[3]
            else:
                iterrev -= 1
            if iterrev in chaininfocache:
                t = chaininfocache[iterrev]
                clen += t[0]
                compresseddeltalen += t[1]
                break
            e = index[iterrev]
        else:
            # Add text length of base since decompressing that also takes
            # work. For cache hits the length is already included.
            compresseddeltalen += e[1]
        r = (clen, compresseddeltalen)
        chaininfocache[rev] = r
        return r
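    # _chaininfo(rev) thus yields (chain length, total compressed size of the
    # chain); e.g. a rev stored as two stacked deltas over a full-text base
    # has chain length 2 and a cost covering both deltas plus the base text.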

    def _deltachain(self, rev, stoprev=None):
        """Obtain the delta chain for a revision.

        ``stoprev`` specifies a revision to stop at. If not specified, we
        stop at the base of the chain.

        Returns a 2-tuple of (chain, stopped) where ``chain`` is a list of
        revs in ascending order and ``stopped`` is a bool indicating whether
        ``stoprev`` was hit.
        """
        # Try C implementation.
        try:
            return self.index.deltachain(rev, stoprev, self._generaldelta)
        except AttributeError:
            pass

        chain = []

        # Alias to prevent attribute lookup in tight loop.
        index = self.index
        generaldelta = self._generaldelta

        iterrev = rev
        e = index[iterrev]
        while iterrev != e[3] and iterrev != stoprev:
            chain.append(iterrev)
            if generaldelta:
                iterrev = e[3]
            else:
                iterrev -= 1
            e = index[iterrev]

        if iterrev == stoprev:
            stopped = True
        else:
            chain.append(iterrev)
            stopped = False

        chain.reverse()
        return chain, stopped
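    # For instance, if rev 7 is a delta over rev 4, which is a delta over the
    # full text at rev 2, _deltachain(7) returns ([2, 4, 7], False), while
    # _deltachain(7, stoprev=4) returns ([7], True).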

    def ancestors(self, revs, stoprev=0, inclusive=False):
        """Generate the ancestors of 'revs' in reverse topological order.
        Does not generate revs lower than stoprev.

        See the documentation for ancestor.lazyancestors for more details."""

        return ancestor.lazyancestors(self.parentrevs, revs, stoprev=stoprev,
                                      inclusive=inclusive)

    def descendants(self, revs):
        """Generate the descendants of 'revs' in revision order.

        Yield a sequence of revision numbers starting with a child of
        some rev in revs, i.e., each revision is *not* considered a
        descendant of itself. Results are ordered by revision number (a
        topological sort)."""
        first = min(revs)
        if first == nullrev:
            for i in self:
                yield i
            return

        seen = set(revs)
        for i in self.revs(start=first + 1):
            for x in self.parentrevs(i):
                if x != nullrev and x in seen:
                    seen.add(i)
                    yield i
                    break
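    # The forward scan above is valid because a revlog child always has a
    # higher revision number than either of its parents, so by the time a
    # revision is visited its parents have already been classified.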

    def findcommonmissing(self, common=None, heads=None):
        """Return a tuple of the ancestors of common and the ancestors of heads
        that are not ancestors of common. In revset terminology, we return the
        tuple:

          ::common, (::heads) - (::common)

        The list is sorted by revision number, meaning it is
        topologically sorted.

        'heads' and 'common' are both lists of node IDs. If heads is
        not supplied, uses all of the revlog's heads. If common is not
        supplied, uses nullid."""
        if common is None:
            common = [nullid]
        if heads is None:
            heads = self.heads()

        common = [self.rev(n) for n in common]
        heads = [self.rev(n) for n in heads]

        # we want the ancestors, but inclusive
        class lazyset(object):
            def __init__(self, lazyvalues):
                self.addedvalues = set()
                self.lazyvalues = lazyvalues

            def __contains__(self, value):
                return value in self.addedvalues or value in self.lazyvalues

            def __iter__(self):
                added = self.addedvalues
                for r in added:
                    yield r
                for r in self.lazyvalues:
                    if not r in added:
                        yield r

            def add(self, value):
                self.addedvalues.add(value)

            def update(self, values):
                self.addedvalues.update(values)

        has = lazyset(self.ancestors(common))
        has.add(nullrev)
        has.update(common)

        # take all ancestors from heads that aren't in has
        missing = set()
        visit = collections.deque(r for r in heads if r not in has)
        while visit:
            r = visit.popleft()
            if r in missing:
                continue
            else:
                missing.add(r)
                for p in self.parentrevs(r):
                    if p not in has:
                        visit.append(p)
        missing = list(missing)
        missing.sort()
        return has, [self.node(miss) for miss in missing]

    def incrementalmissingrevs(self, common=None):
        """Return an object that can be used to incrementally compute the
        revision numbers of the ancestors of arbitrary sets that are not
        ancestors of common. This is an ancestor.incrementalmissingancestors
        object.

        'common' is a list of revision numbers. If common is not supplied, uses
        nullrev.
        """
        if common is None:
            common = [nullrev]

        return ancestor.incrementalmissingancestors(self.parentrevs, common)

    def findmissingrevs(self, common=None, heads=None):
        """Return the revision numbers of the ancestors of heads that
        are not ancestors of common.

        More specifically, return a list of revision numbers corresponding to
        nodes N such that every N satisfies the following constraints:

          1. N is an ancestor of some node in 'heads'
          2. N is not an ancestor of any node in 'common'

        The list is sorted by revision number, meaning it is
        topologically sorted.

        'heads' and 'common' are both lists of revision numbers. If heads is
        not supplied, uses all of the revlog's heads. If common is not
        supplied, uses nullrev."""
        if common is None:
            common = [nullrev]
        if heads is None:
            heads = self.headrevs()

        inc = self.incrementalmissingrevs(common=common)
        return inc.missingancestors(heads)

    def findmissing(self, common=None, heads=None):
        """Return the ancestors of heads that are not ancestors of common.

        More specifically, return a list of nodes N such that every N
        satisfies the following constraints:

          1. N is an ancestor of some node in 'heads'
          2. N is not an ancestor of any node in 'common'

        The list is sorted by revision number, meaning it is
        topologically sorted.

        'heads' and 'common' are both lists of node IDs. If heads is
        not supplied, uses all of the revlog's heads. If common is not
        supplied, uses nullid."""
        if common is None:
            common = [nullid]
        if heads is None:
            heads = self.heads()

        common = [self.rev(n) for n in common]
        heads = [self.rev(n) for n in heads]

        inc = self.incrementalmissingrevs(common=common)
        return [self.node(r) for r in inc.missingancestors(heads)]

    def nodesbetween(self, roots=None, heads=None):
        """Return a topological path from 'roots' to 'heads'.

        Return a tuple (nodes, outroots, outheads) where 'nodes' is a
        topologically sorted list of all nodes N that satisfy both of
        these constraints:

          1. N is a descendant of some node in 'roots'
          2. N is an ancestor of some node in 'heads'

        Every node is considered to be both a descendant and an ancestor
        of itself, so every reachable node in 'roots' and 'heads' will be
        included in 'nodes'.

        'outroots' is the list of reachable nodes in 'roots', i.e., the
        subset of 'roots' that is returned in 'nodes'. Likewise,
        'outheads' is the subset of 'heads' that is also in 'nodes'.

        'roots' and 'heads' are both lists of node IDs. If 'roots' is
        unspecified, uses nullid as the only root. If 'heads' is
        unspecified, uses the list of all of the revlog's heads."""
        nonodes = ([], [], [])
        if roots is not None:
            roots = list(roots)
            if not roots:
                return nonodes
            lowestrev = min([self.rev(n) for n in roots])
        else:
            roots = [nullid] # Everybody's a descendant of nullid
            lowestrev = nullrev
        if (lowestrev == nullrev) and (heads is None):
            # We want _all_ the nodes!
            return ([self.node(r) for r in self], [nullid], list(self.heads()))
        if heads is None:
            # All nodes are ancestors, so the latest ancestor is the last
            # node.
            highestrev = len(self) - 1
            # Set ancestors to None to signal that every node is an ancestor.
            ancestors = None
            # Set heads to an empty dictionary for later discovery of heads
            heads = {}
        else:
            heads = list(heads)
            if not heads:
                return nonodes
            ancestors = set()
            # Turn heads into a dictionary so we can remove 'fake' heads.
            # Also, later we will be using it to filter out the heads we can't
            # find from roots.
            heads = dict.fromkeys(heads, False)
            # Start at the top and keep marking parents until we're done.
            nodestotag = set(heads)
            # Remember where the top was so we can use it as a limit later.
            highestrev = max([self.rev(n) for n in nodestotag])
            while nodestotag:
                # grab a node to tag
                n = nodestotag.pop()
                # Never tag nullid
                if n == nullid:
                    continue
                # A node's revision number represents its place in a
                # topologically sorted list of nodes.
                r = self.rev(n)
                if r >= lowestrev:
                    if n not in ancestors:
                        # If we are possibly a descendant of one of the roots
                        # and we haven't already been marked as an ancestor
                        ancestors.add(n) # Mark as ancestor
                        # Add non-nullid parents to list of nodes to tag.
                        nodestotag.update([p for p in self.parents(n) if
                                           p != nullid])
                    elif n in heads: # We've seen it before, is it a fake head?
                        # So it is, real heads should not be the ancestors of
                        # any other heads.
                        heads.pop(n)
            if not ancestors:
                return nonodes
            # Now that we have our set of ancestors, we want to remove any
            # roots that are not ancestors.

            # If one of the roots was nullid, everything is included anyway.
            if lowestrev > nullrev:
                # But, since we weren't, let's recompute the lowest rev to not
                # include roots that aren't ancestors.

                # Filter out roots that aren't ancestors of heads
                roots = [root for root in roots if root in ancestors]
                # Recompute the lowest revision
                if roots:
                    lowestrev = min([self.rev(root) for root in roots])
                else:
                    # No more roots? Return empty list
                    return nonodes
            else:
                # We are descending from nullid, and don't need to care about
                # any other roots.
                lowestrev = nullrev
                roots = [nullid]
        # Transform our roots list into a set.
        descendants = set(roots)
        # Also, keep the original roots so we can filter out roots that aren't
        # 'real' roots (i.e. are descended from other roots).
        roots = descendants.copy()
        # Our topologically sorted list of output nodes.
        orderedout = []
        # Don't start at nullid since we don't want nullid in our output list,
        # and if nullid shows up in descendants, empty parents will look like
        # they're descendants.
        for r in self.revs(start=max(lowestrev, 0), stop=highestrev + 1):
            n = self.node(r)
            isdescendant = False
            if lowestrev == nullrev: # Everybody is a descendant of nullid
                isdescendant = True
            elif n in descendants:
                # n is already a descendant
                isdescendant = True
                # This check only needs to be done here because all the roots
                # will start being marked as descendants before the loop.
                if n in roots:
                    # If n was a root, check if it's a 'real' root.
                    p = tuple(self.parents(n))
                    # If any of its parents are descendants, it's not a root.
                    if (p[0] in descendants) or (p[1] in descendants):
                        roots.remove(n)
            else:
                p = tuple(self.parents(n))
                # A node is a descendant if either of its parents are
                # descendants. (We seeded the dependents list with the roots
                # up there, remember?)
                if (p[0] in descendants) or (p[1] in descendants):
                    descendants.add(n)
                    isdescendant = True
            if isdescendant and ((ancestors is None) or (n in ancestors)):
                # Only include nodes that are both descendants and ancestors.
                orderedout.append(n)
                if (ancestors is not None) and (n in heads):
                    # We're trying to figure out which heads are reachable
                    # from roots.
                    # Mark this head as having been reached
                    heads[n] = True
                elif ancestors is None:
                    # Otherwise, we're trying to discover the heads.
                    # Assume this is a head because if it isn't, the next step
                    # will eventually remove it.
                    heads[n] = True
                    # But, obviously its parents aren't.
                    for p in self.parents(n):
                        heads.pop(p, None)
        heads = [head for head, flag in heads.iteritems() if flag]
        roots = list(roots)
        assert orderedout
        assert roots
        assert heads
        return (orderedout, roots, heads)
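    # Roughly: nodesbetween first walks up from 'heads' marking ancestors,
    # prunes 'roots' down to actual ancestors, then sweeps revisions in
    # ascending order marking descendants, and emits only the nodes that
    # are both.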

    def headrevs(self):
        try:
            return self.index.headrevs()
        except AttributeError:
            return self._headrevs()

    def computephases(self, roots):
        return self.index.computephasesmapsets(roots)

    def _headrevs(self):
        count = len(self)
        if not count:
            return [nullrev]
        # we won't iterate over filtered revs, so no rev is a head at the start
        ishead = [0] * (count + 1)
        index = self.index
        for r in self:
            ishead[r] = 1 # I may be a head
            e = index[r]
            ishead[e[5]] = ishead[e[6]] = 0 # my parents are not
        return [r for r, val in enumerate(ishead) if val]

    def heads(self, start=None, stop=None):
        """return the list of all nodes that have no children

        if start is specified, only heads that are descendants of
        start will be returned
        if stop is specified, it will consider all the revs from stop
        as if they had no children
        """
        if start is None and stop is None:
            if not len(self):
                return [nullid]
            return [self.node(r) for r in self.headrevs()]

        if start is None:
            start = nullid
        if stop is None:
            stop = []
        stoprevs = set([self.rev(n) for n in stop])
        startrev = self.rev(start)
        reachable = {startrev}
        heads = {startrev}

        parentrevs = self.parentrevs
        for r in self.revs(start=startrev + 1):
            for p in parentrevs(r):
                if p in reachable:
                    if r not in stoprevs:
                        reachable.add(r)
                    heads.add(r)
                if p in heads and p not in stoprevs:
                    heads.remove(p)

        return [self.node(r) for r in heads]

    def children(self, node):
        """find the children of a given node"""
        c = []
        p = self.rev(node)
        for r in self.revs(start=p + 1):
            prevs = [pr for pr in self.parentrevs(r) if pr != nullrev]
            if prevs:
                for pr in prevs:
                    if pr == p:
                        c.append(self.node(r))
            elif p == nullrev:
                c.append(self.node(r))
        return c
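    # Revlogs index parents, not children, so children are recovered by a
    # linear scan over every revision after the node, checking whether it
    # lists the node as a parent.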

    def commonancestorsheads(self, a, b):
        """calculate all the heads of the common ancestors of nodes a and b"""
        a, b = self.rev(a), self.rev(b)
        ancs = self._commonancestorsheads(a, b)
        return pycompat.maplist(self.node, ancs)

    def _commonancestorsheads(self, *revs):
        """calculate all the heads of the common ancestors of revs"""
        try:
            ancs = self.index.commonancestorsheads(*revs)
        except (AttributeError, OverflowError): # C implementation failed
            ancs = ancestor.commonancestorsheads(self.parentrevs, *revs)
        return ancs

    def isancestor(self, a, b):
        """return True if node a is an ancestor of node b

        A revision is considered an ancestor of itself."""
        a, b = self.rev(a), self.rev(b)
        return self.isancestorrev(a, b)

    def isancestorrev(self, a, b):
        """return True if revision a is an ancestor of revision b

        A revision is considered an ancestor of itself.

        The implementation of this is trivial but the use of
        commonancestorsheads is not."""
        if a == nullrev:
            return True
        elif a == b:
            return True
        elif a > b:
            return False
        return a in self._commonancestorsheads(a, b)
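    # The a > b fast path is sound because revision numbers are assigned in
    # topological order: an ancestor always has a lower number than its
    # descendants. The final check works since, when a is an ancestor of b,
    # a itself must be one of the heads of the common ancestors of {a, b}.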

    def ancestor(self, a, b):
        """calculate the "best" common ancestor of nodes a and b"""

        a, b = self.rev(a), self.rev(b)
        try:
            ancs = self.index.ancestors(a, b)
        except (AttributeError, OverflowError):
            ancs = ancestor.ancestors(self.parentrevs, a, b)
        if ancs:
            # choose a consistent winner when there's a tie
            return min(map(self.node, ancs))
        return nullid

    def _match(self, id):
        if isinstance(id, int):
            # rev
            return self.node(id)
        if len(id) == 20:
            # possibly a binary node
            # odds of a binary node being all hex in ASCII are 1 in 10**25
            try:
                node = id
                self.rev(node) # quick search the index
                return node
            except LookupError:
                pass # may be partial hex id
        try:
            # str(rev)
            rev = int(id)
            if "%d" % rev != id:
                raise ValueError
            if rev < 0:
                rev = len(self) + rev
            if rev < 0 or rev >= len(self):
                raise ValueError
            return self.node(rev)
        except (ValueError, OverflowError):
            pass
        if len(id) == 40:
            try:
                # a full hex nodeid?
                node = bin(id)
                self.rev(node)
                return node
            except (TypeError, LookupError):
                pass

    def _partialmatch(self, id):
        # we don't care about wdirfilenodeids as they should always be full
        # hashes
        maybewdir = wdirhex.startswith(id)
        try:
            partial = self.index.partialmatch(id)
            if partial and self.hasnode(partial):
                if maybewdir:
                    # single 'ff...' match in radix tree, ambiguous with wdir
                    raise RevlogError
                return partial
            if maybewdir:
                # no 'ff...' match in radix tree, wdir identified
                raise error.WdirUnsupported
            return None
        except RevlogError:
            # parsers.c radix tree lookup gave multiple matches
            # fast path: for unfiltered changelog, radix tree is accurate
            if not getattr(self, 'filteredrevs', None):
                raise AmbiguousPrefixLookupError(id, self.indexfile,
                                                 _('ambiguous identifier'))
            # fall through to slow path that filters hidden revisions
        except (AttributeError, ValueError):
            # we are pure python, or key was too short to search radix tree
            pass

        if id in self._pcache:
            return self._pcache[id]

        if len(id) <= 40:
            try:
                # hex(node)[:...]
                l = len(id) // 2 # grab an even number of digits
                prefix = bin(id[:l * 2])
                nl = [e[7] for e in self.index if e[7].startswith(prefix)]
                nl = [n for n in nl if hex(n).startswith(id) and
                      self.hasnode(n)]
                if nullhex.startswith(id):
                    nl.append(nullid)
                if len(nl) > 0:
                    if len(nl) == 1 and not maybewdir:
                        self._pcache[id] = nl[0]
                        return nl[0]
                    raise AmbiguousPrefixLookupError(id, self.indexfile,
                                                     _('ambiguous identifier'))
                if maybewdir:
                    raise error.WdirUnsupported
                return None
            except TypeError:
                pass

    def lookup(self, id):
        """locate a node based on:
            - revision number or str(revision number)
            - nodeid or subset of hex nodeid
        """
        n = self._match(id)
        if n is not None:
            return n
        n = self._partialmatch(id)
        if n:
            return n

        raise LookupError(id, self.indexfile, _('no match found'))

    def shortest(self, node, minlength=1):
        """Find the shortest unambiguous prefix that matches node."""
        def isvalid(prefix):
            try:
                node = self._partialmatch(prefix)
            except error.RevlogError:
                return False
            except error.WdirUnsupported:
                # single 'ff...' match
                return True
            if node is None:
                raise LookupError(node, self.indexfile, _('no node'))
            return True

        def maybewdir(prefix):
            return all(c == 'f' for c in prefix)

        hexnode = hex(node)

        def disambiguate(hexnode, minlength):
            """Disambiguate against wdirid."""
            for length in range(minlength, 41):
                prefix = hexnode[:length]
                if not maybewdir(prefix):
                    return prefix

        if not getattr(self, 'filteredrevs', None):
            try:
                length = max(self.index.shortest(node), minlength)
                return disambiguate(hexnode, length)
            except RevlogError:
                if node != wdirid:
                    raise LookupError(node, self.indexfile, _('no node'))
            except AttributeError:
                # Fall through to pure code
                pass

        if node == wdirid:
            for length in range(minlength, 41):
                prefix = hexnode[:length]
                if isvalid(prefix):
                    return prefix

        for length in range(minlength, 41):
            prefix = hexnode[:length]
            if isvalid(prefix):
                return disambiguate(hexnode, length)

    def cmp(self, node, text):
        """compare text with a given file revision

        returns True if text is different from what is stored.
        """
        p1, p2 = self.parents(node)
        return hash(text, p1, p2) != node

    def _cachesegment(self, offset, data):
        """Add a segment to the revlog cache.

        Accepts an absolute offset and the data that is at that location.
        """
        o, d = self._chunkcache
        # try to add to existing cache
        if o + len(d) == offset and len(d) + len(data) < _chunksize:
            self._chunkcache = o, d + data
        else:
            self._chunkcache = offset, data

    def _readsegment(self, offset, length, df=None):
        """Load a segment of raw data from the revlog.

        Accepts an absolute offset, length to read, and an optional existing
        file handle to read from.

        If an existing file handle is passed, it will be seeked and the
        original seek position will NOT be restored.

        Returns a str or buffer of raw byte data.
        """
        # Cache data both forward and backward around the requested
        # data, in a fixed size window. This helps speed up operations
        # involving reading the revlog backwards.
        cachesize = self._chunkcachesize
        realoffset = offset & ~(cachesize - 1)
        reallength = (((offset + length + cachesize) & ~(cachesize - 1))
                      - realoffset)
        with self._datareadfp(df) as df:
            df.seek(realoffset)
            d = df.read(reallength)
        self._cachesegment(realoffset, d)
        if offset != realoffset or reallength != length:
            return util.buffer(d, offset - realoffset, length)
        return d
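    # For example, with the default cachesize of 65536, a request for
    # offset=70000, length=100 rounds down to realoffset=65536 and reads
    # reallength=65536 bytes, so nearby requests in either direction are
    # then served from the cache.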

    def _getsegment(self, offset, length, df=None):
        """Obtain a segment of raw data from the revlog.

        Accepts an absolute offset, length of bytes to obtain, and an
        optional file handle to the already-opened revlog. If the file
        handle is used, its original seek position will not be preserved.

        Requests for data may be returned from a cache.

        Returns a str or a buffer instance of raw byte data.
        """
        o, d = self._chunkcache
        l = len(d)

        # is it in the cache?
        cachestart = offset - o
        cacheend = cachestart + length
        if cachestart >= 0 and cacheend <= l:
            if cachestart == 0 and cacheend == l:
                return d # avoid a copy
            return util.buffer(d, cachestart, cacheend - cachestart)

        return self._readsegment(offset, length, df=df)

    def _getsegmentforrevs(self, startrev, endrev, df=None):
        """Obtain a segment of raw data corresponding to a range of revisions.

        Accepts the start and end revisions and an optional already-open
        file handle to be used for reading. If the file handle is read, its
        seek position will not be preserved.

        Requests for data may be satisfied by a cache.

        Returns a 2-tuple of (offset, data) for the requested range of
        revisions. Offset is the integer offset from the beginning of the
        revlog and data is a str or buffer of the raw byte data.

        Callers will need to call ``self.start(rev)`` and ``self.length(rev)``
        to determine where each revision's data begins and ends.
        """
        # Inlined self.start(startrev) & self.end(endrev) for perf reasons
        # (functions are expensive).
        index = self.index
        istart = index[startrev]
        start = int(istart[0] >> 16)
        if startrev == endrev:
            end = start + istart[1]
        else:
            iend = index[endrev]
            end = int(iend[0] >> 16) + iend[1]

        if self._inline:
            start += (startrev + 1) * self._io.size
            end += (endrev + 1) * self._io.size
        length = end - start

        return start, self._getsegment(start, length, df=df)
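    # Note the inline adjustment: in an inline revlog the index entries and
    # data chunks are interleaved in a single file, so each of the first
    # (rev + 1) index entries shifts the data offsets by self._io.size bytes.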

    def _chunk(self, rev, df=None):
        """Obtain a single decompressed chunk for a revision.

        Accepts an integer revision and an optional already-open file handle
        to be used for reading. If used, the seek position of the file will not
        be preserved.

        Returns a str holding uncompressed data for the requested revision.
        """
        return self.decompress(self._getsegmentforrevs(rev, rev, df=df)[1])

    def _chunks(self, revs, df=None, targetsize=None):
        """Obtain decompressed chunks for the specified revisions.

        Accepts an iterable of numeric revisions that are assumed to be in
        ascending order. Also accepts an optional already-open file handle
        to be used for reading. If used, the seek position of the file will
        not be preserved.

        This function is similar to calling ``self._chunk()`` multiple times,
        but is faster.

        Returns a list with decompressed data for each requested revision.
        """
        if not revs:
            return []
        start = self.start
        length = self.length
        inline = self._inline
        iosize = self._io.size
        buffer = util.buffer

        l = []
        ladd = l.append

        if not self._withsparseread:
            slicedchunks = (revs,)
        else:
-            slicedchunks = _slicechunk(self, revs, targetsize=targetsize)
+            slicedchunks = deltautil.slicechunk(self, revs,
+                                                targetsize=targetsize)

        for revschunk in slicedchunks:
            firstrev = revschunk[0]
            # Skip trailing revisions with empty diff
            for lastrev in revschunk[::-1]:
                if length(lastrev) != 0:
                    break

            try:
                offset, data = self._getsegmentforrevs(firstrev, lastrev, df=df)
            except OverflowError:
                # issue4215 - we can't cache a run of chunks greater than
                # 2G on Windows
                return [self._chunk(rev, df=df) for rev in revschunk]

            decomp = self.decompress
            for rev in revschunk:
                chunkstart = start(rev)
                if inline:
                    chunkstart += (rev + 1) * iosize
                chunklength = length(rev)
                ladd(decomp(buffer(data, chunkstart - offset, chunklength)))

        return l
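    # slicechunk (moved to mercurial/revlogutils/deltas.py by this change)
    # splits the requested revs into groups that are dense on disk, so each
    # group can be fetched with one contiguous read instead of one read per
    # revision.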

    def _chunkclear(self):
        """Clear the raw chunk cache."""
        self._chunkcache = (0, '')

    def deltaparent(self, rev):
        """return deltaparent of the given revision"""
        base = self.index[rev][3]
        if base == rev:
            return nullrev
        elif self._generaldelta:
            return base
        else:
            return rev - 1
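    # In a generaldelta revlog the index stores the actual delta parent, so
    # base is returned directly; in the legacy layout a delta always applies
    # on top of the previous revision, hence rev - 1. A base equal to rev
    # means the revision is stored as a full text (no delta parent).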

    def issnapshot(self, rev):
        """tells whether rev is a snapshot
        """
        if rev == nullrev:
            return True
        deltap = self.deltaparent(rev)
        if deltap == nullrev:
            return True
        p1, p2 = self.parentrevs(rev)
        if deltap in (p1, p2):
            return False
        return self.issnapshot(deltap)

    def snapshotdepth(self, rev):
        """number of snapshots in the chain before this one"""
        if not self.issnapshot(rev):
            raise ProgrammingError('revision %d not a snapshot' % rev)
        return len(self._deltachain(rev)[0]) - 1
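    # A snapshot is (recursively) either a full text, or a revision whose
    # delta applies on top of another snapshot rather than on one of its
    # parents. snapshotdepth counts the snapshots below rev in its delta
    # chain.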

    def revdiff(self, rev1, rev2):
        """return or calculate a delta between two revisions

        The delta calculated is in binary form and is intended to be written to
        revlog data directly. So this function needs raw revision data.
        """
        if rev1 != nullrev and self.deltaparent(rev2) == rev1:
            return bytes(self._chunk(rev2))

        return mdiff.textdiff(self.revision(rev1, raw=True),
                              self.revision(rev2, raw=True))
2168
1566
    def revision(self, nodeorrev, _df=None, raw=False):
        """return an uncompressed revision of a given node or revision
        number.

        _df - an existing file handle to read from. (internal-only)
        raw - an optional argument specifying if the revision data is to be
        treated as raw data when applying flag transforms. 'raw' should be set
        to True when generating changegroups or in debug commands.
        """
        if isinstance(nodeorrev, int):
            rev = nodeorrev
            node = self.node(rev)
        else:
            node = nodeorrev
            rev = None

        cachedrev = None
        flags = None
        rawtext = None
        if node == nullid:
            return ""
        if self._cache:
            if self._cache[0] == node:
                # _cache only stores rawtext
                if raw:
                    return self._cache[2]
                # duplicated, but good for perf
                if rev is None:
                    rev = self.rev(node)
                if flags is None:
                    flags = self.flags(rev)
                # no extra flags set, no flag processor runs, text = rawtext
                if flags == REVIDX_DEFAULT_FLAGS:
                    return self._cache[2]
                # rawtext is reusable. need to run flag processor
                rawtext = self._cache[2]

            cachedrev = self._cache[1]

        # look up what we need to read
        if rawtext is None:
            if rev is None:
                rev = self.rev(node)

            chain, stopped = self._deltachain(rev, stoprev=cachedrev)
            if stopped:
                rawtext = self._cache[2]

            # drop cache to save memory
            self._cache = None

            targetsize = None
            rawsize = self.index[rev][2]
            if 0 <= rawsize:
                targetsize = 4 * rawsize

            bins = self._chunks(chain, df=_df, targetsize=targetsize)
            if rawtext is None:
                rawtext = bytes(bins[0])
                bins = bins[1:]

            rawtext = mdiff.patches(rawtext, bins)
            self._cache = (node, rev, rawtext)

        if flags is None:
            if rev is None:
                rev = self.rev(node)
            flags = self.flags(rev)

        text, validatehash = self._processflags(rawtext, flags, 'read', raw=raw)
        if validatehash:
            self.checkhash(text, node, rev=rev)

        return text

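    # Sketch of the read path implemented by revision() above: consult the
    # single-entry (node, rev, rawtext) cache, otherwise resolve the delta
    # chain (stopping early if the cached revision is part of it), read and
    # decompress the chunks with _chunks(), fold them together with
    # mdiff.patches(), then run any flag processors on the result before
    # optionally validating the hash.
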
    def hash(self, text, p1, p2):
        """Compute a node hash.

        Available as a function so that subclasses can replace the hash
        as needed.
        """
        return hash(text, p1, p2)

    def _processflags(self, text, flags, operation, raw=False):
        """Inspect revision data flags and apply transforms defined by
        registered flag processors.

        ``text`` - the revision data to process
        ``flags`` - the revision flags
        ``operation`` - the operation being performed (read or write)
        ``raw`` - an optional argument describing if the raw transform should be
        applied.

        This method processes the flags in the order (or reverse order if
        ``operation`` is 'write') defined by REVIDX_FLAGS_ORDER, applying the
        flag processors registered for present flags. The order of flags defined
        in REVIDX_FLAGS_ORDER needs to be stable to allow non-commutativity.

        Returns a 2-tuple of ``(text, validatehash)`` where ``text`` is the
        processed text and ``validatehash`` is a bool indicating whether the
        returned text should be checked for hash integrity.

        Note: If the ``raw`` argument is set, it has precedence over the
        operation and will only update the value of ``validatehash``.
        """
        # fast path: no flag processors will run
        if flags == 0:
            return text, True
        if operation not in ('read', 'write'):
            raise ProgrammingError(_("invalid '%s' operation") % operation)
        # Check all flags are known.
        if flags & ~REVIDX_KNOWN_FLAGS:
            raise RevlogError(_("incompatible revision flag '%#x'") %
                              (flags & ~REVIDX_KNOWN_FLAGS))
        validatehash = True
        # Depending on the operation (read or write), the order might be
        # reversed due to non-commutative transforms.
        orderedflags = REVIDX_FLAGS_ORDER
        if operation == 'write':
            orderedflags = reversed(orderedflags)

        for flag in orderedflags:
            # If a flagprocessor has been registered for a known flag, apply the
            # related operation transform and update result tuple.
            if flag & flags:
                vhash = True

                if flag not in _flagprocessors:
                    message = _("missing processor for flag '%#x'") % (flag)
                    raise RevlogError(message)

                processor = _flagprocessors[flag]
                if processor is not None:
                    readtransform, writetransform, rawtransform = processor

                    if raw:
                        vhash = rawtransform(self, text)
                    elif operation == 'read':
                        text, vhash = readtransform(self, text)
                    else: # write operation
                        text, vhash = writetransform(self, text)
                    validatehash = validatehash and vhash

        return text, validatehash

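    # A registered flag processor is a (readtransform, writetransform,
    # rawtransform) triple. A hypothetical processor that stores text
    # base64-encoded could look like this (REVIDX_SOMEFLAG and the helper
    # names are illustrative, not real registered names):
    #
    #   def _b64read(rl, text):
    #       return base64.b64decode(text), True
    #   def _b64write(rl, text):
    #       return base64.b64encode(text), True
    #   def _b64raw(rl, text):
    #       return False  # the stored rawtext does not hash to the node
    #
    #   _flagprocessors[REVIDX_SOMEFLAG] = (_b64read, _b64write, _b64raw)
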
    def checkhash(self, text, node, p1=None, p2=None, rev=None):
        """Check node hash integrity.

        Available as a function so that subclasses can extend hash mismatch
        behaviors as needed.
        """
        try:
            if p1 is None and p2 is None:
                p1, p2 = self.parents(node)
            if node != self.hash(text, p1, p2):
                revornode = rev
                if revornode is None:
                    revornode = templatefilters.short(hex(node))
                raise RevlogError(_("integrity check failed on %s:%s")
                                  % (self.indexfile, pycompat.bytestr(revornode)))
        except RevlogError:
            if self._censorable and _censoredtext(text):
                raise error.CensoredNodeError(self.indexfile, node, text)
            raise

    def _enforceinlinesize(self, tr, fp=None):
        """Check if the revlog is too big for inline and convert if so.

        This should be called after revisions are added to the revlog. If the
        revlog has grown too large to be an inline revlog, it will convert it
        to use multiple index and data files.
        """
        tiprev = len(self) - 1
        if (not self._inline or
            (self.start(tiprev) + self.length(tiprev)) < _maxinline):
            return

        trinfo = tr.find(self.indexfile)
        if trinfo is None:
            raise RevlogError(_("%s not found in the transaction")
                              % self.indexfile)

        trindex = trinfo[2]
        if trindex is not None:
            dataoff = self.start(trindex)
        else:
            # revlog was stripped at start of transaction, use all leftover data
            trindex = len(self) - 1
            dataoff = self.end(tiprev)

        tr.add(self.datafile, dataoff)

        if fp:
            fp.flush()
            fp.close()

        with self._datafp('w') as df:
            for r in self:
                df.write(self._getsegmentforrevs(r, r)[1])

        with self._indexfp('w') as fp:
            self.version &= ~FLAG_INLINE_DATA
            self._inline = False
            io = self._io
            for i in self:
                e = io.packentry(self.index[i], self.node, self.version, i)
                fp.write(e)

            # the temp file replaces the real index when we exit the context
            # manager

        tr.replace(self.indexfile, trindex * self._io.size)
        self._chunkclear()

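    # Background for _enforceinlinesize(): small revlogs keep their data
    # interleaved with the index in the ".i" file to avoid a second file per
    # tracked file. Once the inline data grows past _maxinline, the method
    # above copies the data out to a separate ".d" file, rewrites the index
    # without FLAG_INLINE_DATA, and drops the now-stale chunk cache.
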
    def addrevision(self, text, transaction, link, p1, p2, cachedelta=None,
                    node=None, flags=REVIDX_DEFAULT_FLAGS, deltacomputer=None):
        """add a revision to the log

        text - the revision data to add
        transaction - the transaction object used for rollback
        link - the linkrev data to add
        p1, p2 - the parent nodeids of the revision
        cachedelta - an optional precomputed delta
        node - nodeid of revision; typically node is not specified, and it is
            computed by default as hash(text, p1, p2), however subclasses might
            use a different hashing method (and override checkhash() in such case)
        flags - the known flags to set on the revision
-       deltacomputer - an optional _deltacomputer instance shared between
+       deltacomputer - an optional deltacomputer instance shared between
            multiple calls
        """
        if link == nullrev:
            raise RevlogError(_("attempted to add linkrev -1 to %s")
                              % self.indexfile)

        if flags:
            node = node or self.hash(text, p1, p2)

        rawtext, validatehash = self._processflags(text, flags, 'write')

        # If the flag processor modifies the revision data, ignore any provided
        # cachedelta.
        if rawtext != text:
            cachedelta = None

        if len(rawtext) > _maxentrysize:
            raise RevlogError(
                _("%s: size of %d bytes exceeds maximum revlog storage of 2GiB")
                % (self.indexfile, len(rawtext)))

        node = node or self.hash(rawtext, p1, p2)
        if node in self.nodemap:
            return node

        if validatehash:
            self.checkhash(rawtext, node, p1=p1, p2=p2)

        return self.addrawrevision(rawtext, transaction, link, p1, p2, node,
                                   flags, cachedelta=cachedelta,
                                   deltacomputer=deltacomputer)

    def addrawrevision(self, rawtext, transaction, link, p1, p2, node, flags,
                       cachedelta=None, deltacomputer=None):
        """add a raw revision with known flags, node and parents
        useful when reusing a revision not stored in this revlog (ex: received
        over wire, or read from an external bundle).
        """
        dfh = None
        if not self._inline:
            dfh = self._datafp("a+")
        ifh = self._indexfp("a+")
        try:
            return self._addrevision(node, rawtext, transaction, link, p1, p2,
                                     flags, cachedelta, ifh, dfh,
                                     deltacomputer=deltacomputer)
        finally:
            if dfh:
                dfh.close()
            ifh.close()

    def compress(self, data):
        """Generate a possibly-compressed representation of data."""
        if not data:
            return '', data

        compressed = self._compressor.compress(data)

        if compressed:
            # The revlog compressor added the header in the returned data.
            return '', compressed

        if data[0:1] == '\0':
            return '', data
        return 'u', data

    def decompress(self, data):
        """Decompress a revlog chunk.

        The chunk is expected to begin with a header identifying the
        format type so it can be routed to an appropriate decompressor.
        """
        if not data:
            return data

        # Revlogs are read much more frequently than they are written and many
        # chunks only take microseconds to decompress, so performance is
        # important here.
        #
        # We can make a few assumptions about revlogs:
        #
        # 1) the majority of chunks will be compressed (as opposed to inline
        #    raw data).
        # 2) decompressing *any* data will likely be at least 10x slower than
        #    returning raw inline data.
        # 3) we want to prioritize common and officially supported compression
        #    engines
        #
        # It follows that we want to optimize for "decompress compressed data
        # when encoded with common and officially supported compression engines"
        # case over "raw data" and "data encoded by less common or non-official
        # compression engines." That is why we have the inline lookup first
        # followed by the compengines lookup.
        #
        # According to `hg perfrevlogchunks`, this is ~0.5% faster for zlib
        # compressed chunks. And this matters for changelog and manifest reads.
        t = data[0:1]

        if t == 'x':
            try:
                return _zlibdecompress(data)
            except zlib.error as e:
                raise RevlogError(_('revlog decompress error: %s') %
                                  stringutil.forcebytestr(e))
        # '\0' is more common than 'u' so it goes first.
        elif t == '\0':
            return data
        elif t == 'u':
            return util.buffer(data, 1)

        try:
            compressor = self._decompressors[t]
        except KeyError:
            try:
                engine = util.compengines.forrevlogheader(t)
                compressor = engine.revlogcompressor()
                self._decompressors[t] = compressor
            except KeyError:
                raise RevlogError(_('unknown compression type %r') % t)

        return compressor.decompress(data)

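    # Header bytes handled by decompress() above: 'u' prefixes an
    # uncompressed chunk (the header byte is stripped), '\0' marks data
    # stored verbatim, and 'x' is zlib. Any other leading byte is resolved
    # through the registered compression engines (the zstd engine, when
    # enabled, registers its own revlog header this way).
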
1916
2519 def _isgooddeltainfo(self, deltainfo, revinfo):
2520 """Returns True if the given delta is good. Good means that it is within
2521 the disk span, disk size, and chain length bounds that we know to be
2522 performant."""
2523 if deltainfo is None:
2524 return False
2525
2526 # - 'deltainfo.distance' is the distance from the base revision --
2527 # bounding it limits the amount of I/O we need to do.
2528 # - 'deltainfo.compresseddeltalen' is the sum of the total size of
2529 # deltas we need to apply -- bounding it limits the amount of CPU
2530 # we consume.
2531
2532 if self._sparserevlog:
2533 # As sparse-read will be used, we can consider that the distance,
2534 # instead of being the span of the whole chunk,
2535 # is the span of the largest read chunk
2536 base = deltainfo.base
2537
2538 if base != nullrev:
2539 deltachain = self._deltachain(base)[0]
2540 else:
2541 deltachain = []
2542
2543 # search for the first non-snapshot revision
2544 for idx, r in enumerate(deltachain):
2545 if not self.issnapshot(r):
2546 break
2547 deltachain = deltachain[idx:]
2548 chunks = _slicechunk(self, deltachain, deltainfo)
2549 all_span = [_segmentspan(self, revs, deltainfo) for revs in chunks]
2550 distance = max(all_span)
2551 else:
2552 distance = deltainfo.distance
2553
2554 textlen = revinfo.textlen
2555 defaultmax = textlen * 4
2556 maxdist = self._maxdeltachainspan
2557 if not maxdist:
2558 maxdist = distance # ensure the conditional pass
2559 maxdist = max(maxdist, defaultmax)
2560 if self._sparserevlog and maxdist < self._srmingapsize:
2561 # In multiple place, we are ignoring irrelevant data range below a
2562 # certain size. Be also apply this tradeoff here and relax span
2563 # constraint for small enought content.
2564 maxdist = self._srmingapsize
2565
2566 # Bad delta from read span:
2567 #
2568 # If the span of data read is larger than the maximum allowed.
2569 if maxdist < distance:
2570 return False
2571
2572 # Bad delta from new delta size:
2573 #
2574 # If the delta size is larger than the target text, storing the
2575 # delta will be inefficient.
2576 if textlen < deltainfo.deltalen:
2577 return False
2578
2579 # Bad delta from cumulated payload size:
2580 #
2581 # If the sum of delta get larger than K * target text length.
2582 if textlen * LIMIT_DELTA2TEXT < deltainfo.compresseddeltalen:
2583 return False
2584
2585 # Bad delta from chain length:
2586 #
2587 # If the number of delta in the chain gets too high.
2588 if self._maxchainlen and self._maxchainlen < deltainfo.chainlen:
2589 return False
2590
2591 # bad delta from intermediate snapshot size limit
2592 #
2593 # If an intermediate snapshot size is higher than the limit. The
2594 # limit exist to prevent endless chain of intermediate delta to be
2595 # created.
2596 if (deltainfo.snapshotdepth is not None and
2597 (textlen >> deltainfo.snapshotdepth) < deltainfo.deltalen):
2598 return False
2599
2600 # bad delta if new intermediate snapshot is larger than the previous
2601 # snapshot
2602 if (deltainfo.snapshotdepth
2603 and self.length(deltainfo.base) < deltainfo.deltalen):
2604 return False
2605
2606 return True
2607
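    # Note: the delta validity checks removed above now live in the new
    # revlogutils.deltas module (imported as deltautil), alongside the rest
    # of the delta computation code this changeset moves out of revlog.py.
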
    def _addrevision(self, node, rawtext, transaction, link, p1, p2, flags,
                     cachedelta, ifh, dfh, alwayscache=False,
                     deltacomputer=None):
        """internal function to add revisions to the log

        see addrevision for argument descriptions.

        note: "addrevision" takes non-raw text, "_addrevision" takes raw text.

        if "deltacomputer" is not provided or None, a defaultdeltacomputer will
        be used.

        invariants:
        - rawtext is optional (can be None); if not set, cachedelta must be set.
          if both are set, they must correspond to each other.
        """
        if node == nullid:
            raise RevlogError(_("%s: attempt to add null revision") %
                              (self.indexfile))
        if node == wdirid or node in wdirfilenodeids:
            raise RevlogError(_("%s: attempt to add wdir revision") %
                              (self.indexfile))

        if self._inline:
            fh = ifh
        else:
            fh = dfh

        btext = [rawtext]

        curr = len(self)
        prev = curr - 1
        offset = self.end(prev)
        p1r, p2r = self.rev(p1), self.rev(p2)

        # full versions are inserted when the needed deltas
        # become comparable to the uncompressed text
        if rawtext is None:
            # need rawtext size, before changed by flag processors, which is
            # the non-raw size. use revlog explicitly to avoid filelog's extra
            # logic that might remove metadata size.
            textlen = mdiff.patchedsize(revlog.size(self, cachedelta[0]),
                                        cachedelta[1])
        else:
            textlen = len(rawtext)

        if deltacomputer is None:
-            deltacomputer = _deltacomputer(self)
+            deltacomputer = deltautil.deltacomputer(self)

        revinfo = _revisioninfo(node, p1, p2, btext, textlen, cachedelta, flags)

        # no delta for flag processor revision (see "candelta" for why)
        # not calling candelta since only one revision needs test, also to
        # avoid overhead fetching flags again.
        if flags & REVIDX_RAWTEXT_CHANGING_FLAGS:
            deltainfo = None
        else:
            deltainfo = deltacomputer.finddeltainfo(revinfo, fh)

        if deltainfo is not None:
            base = deltainfo.base
            chainbase = deltainfo.chainbase
            data = deltainfo.data
            l = deltainfo.deltalen
        else:
            rawtext = deltacomputer.buildtext(revinfo, fh)
            data = self.compress(rawtext)
            l = len(data[1]) + len(data[0])
            base = chainbase = curr

        e = (offset_type(offset, flags), l, textlen,
             base, link, p1r, p2r, node)
        self.index.append(e)
        self.nodemap[node] = curr

        entry = self._io.packentry(e, self.node, self.version, curr)
        self._writeentry(transaction, ifh, dfh, entry, data, link, offset)

        if alwayscache and rawtext is None:
            rawtext = deltacomputer.buildtext(revinfo, fh)

        if type(rawtext) == bytes: # only accept immutable objects
            self._cache = (node, curr, rawtext)
        self._chainbasecache[curr] = chainbase
        return node

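    # Flow of _addrevision() above: a deltautil.deltacomputer (shared across
    # calls when the caller provides one) picks a delta base via
    # finddeltainfo(); when no acceptable delta exists, or the revision has
    # rawtext-changing flags, the full text is compressed and stored as the
    # base of a new chain instead.
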
    def _writeentry(self, transaction, ifh, dfh, entry, data, link, offset):
        # Files opened in a+ mode have inconsistent behavior on various
        # platforms. Windows requires that a file positioning call be made
        # when the file handle transitions between reads and writes. See
        # 3686fa2b8eee and the mixedfilemodewrapper in windows.py. On other
        # platforms, Python or the platform itself can be buggy. Some versions
        # of Solaris have been observed to not append at the end of the file
        # if the file was seeked to before the end. See issue4943 for more.
        #
        # We work around this issue by inserting a seek() before writing.
        # Note: This is likely not necessary on Python 3.
        ifh.seek(0, os.SEEK_END)
        if dfh:
            dfh.seek(0, os.SEEK_END)

        curr = len(self) - 1
        if not self._inline:
            transaction.add(self.datafile, offset)
            transaction.add(self.indexfile, curr * len(entry))
            if data[0]:
                dfh.write(data[0])
            dfh.write(data[1])
            ifh.write(entry)
        else:
            offset += curr * self._io.size
            transaction.add(self.indexfile, offset, curr)
            ifh.write(entry)
            ifh.write(data[0])
            ifh.write(data[1])
            self._enforceinlinesize(transaction, ifh)

    def addgroup(self, deltas, linkmapper, transaction, addrevisioncb=None):
        """
        add a delta group

        given a set of deltas, add them to the revision log. the
        first delta is against its parent, which should be in our
        log, the rest are against the previous delta.

        If ``addrevisioncb`` is defined, it will be called with arguments of
        this revlog and the node that was added.
        """

        nodes = []

        r = len(self)
        end = 0
        if r:
            end = self.end(r - 1)
        ifh = self._indexfp("a+")
        isize = r * self._io.size
        if self._inline:
            transaction.add(self.indexfile, end + isize, r)
            dfh = None
        else:
            transaction.add(self.indexfile, isize, r)
            transaction.add(self.datafile, end)
            dfh = self._datafp("a+")
        def flush():
            if dfh:
                dfh.flush()
            ifh.flush()
        try:
-            deltacomputer = _deltacomputer(self)
+            deltacomputer = deltautil.deltacomputer(self)
            # loop through our set of deltas
            for data in deltas:
                node, p1, p2, linknode, deltabase, delta, flags = data
                link = linkmapper(linknode)
                flags = flags or REVIDX_DEFAULT_FLAGS

                nodes.append(node)

                if node in self.nodemap:
                    # this can happen if two branches make the same change
                    continue

                for p in (p1, p2):
                    if p not in self.nodemap:
                        raise LookupError(p, self.indexfile,
                                          _('unknown parent'))

                if deltabase not in self.nodemap:
                    raise LookupError(deltabase, self.indexfile,
                                      _('unknown delta base'))

                baserev = self.rev(deltabase)

                if baserev != nullrev and self.iscensored(baserev):
                    # if base is censored, delta must be full replacement in a
                    # single patch operation
                    hlen = struct.calcsize(">lll")
                    oldlen = self.rawsize(baserev)
                    newlen = len(delta) - hlen
                    if delta[:hlen] != mdiff.replacediffheader(oldlen, newlen):
                        raise error.CensoredBaseError(self.indexfile,
                                                      self.node(baserev))

                if not flags and self._peek_iscensored(baserev, delta, flush):
                    flags |= REVIDX_ISCENSORED

                # We assume consumers of addrevisioncb will want to retrieve
                # the added revision, which will require a call to
                # revision(). revision() will fast path if there is a cache
                # hit. So, we tell _addrevision() to always cache in this case.
                # We're only using addgroup() in the context of changegroup
                # generation so the revision data can always be handled as raw
                # by the flagprocessor.
                self._addrevision(node, None, transaction, link,
                                  p1, p2, flags, (baserev, delta),
                                  ifh, dfh,
                                  alwayscache=bool(addrevisioncb),
                                  deltacomputer=deltacomputer)

                if addrevisioncb:
                    addrevisioncb(self, node)

                if not dfh and not self._inline:
                    # addrevision switched from inline to conventional
                    # reopen the index
                    ifh.close()
                    dfh = self._datafp("a+")
                    ifh = self._indexfp("a+")
        finally:
            if dfh:
                dfh.close()
            ifh.close()

        return nodes

    def iscensored(self, rev):
        """Check if a file revision is censored."""
        if not self._censorable:
            return False

        return self.flags(rev) & REVIDX_ISCENSORED

    def _peek_iscensored(self, baserev, delta, flush):
        """Quickly check if a delta produces a censored revision."""
        if not self._censorable:
            return False

        # Fragile heuristic: unless new file meta keys are added alphabetically
        # preceding "censored", all censored revisions are prefixed by
        # "\1\ncensored:". A delta producing such a censored revision must be a
        # full-replacement delta, so we inspect the first and only patch in the
        # delta for this prefix.
        hlen = struct.calcsize(">lll")
        if len(delta) <= hlen:
            return False

        oldlen = self.rawsize(baserev)
        newlen = len(delta) - hlen
        if delta[:hlen] != mdiff.replacediffheader(oldlen, newlen):
            return False

        add = "\1\ncensored:"
        addlen = len(add)
        return newlen >= addlen and delta[hlen:hlen + addlen] == add

    def getstrippoint(self, minlink):
        """find the minimum rev that must be stripped to strip the linkrev

        Returns a tuple containing the minimum rev and a set of all revs that
        have linkrevs that will be broken by this strip.
        """
        brokenrevs = set()
        strippoint = len(self)

        heads = {}
        futurelargelinkrevs = set()
        for head in self.headrevs():
            headlinkrev = self.linkrev(head)
            heads[head] = headlinkrev
            if headlinkrev >= minlink:
                futurelargelinkrevs.add(headlinkrev)

        # This algorithm involves walking down the rev graph, starting at the
        # heads. Since the revs are topologically sorted according to linkrev,
        # once all head linkrevs are below the minlink, we know there are
        # no more revs that could have a linkrev greater than minlink.
        # So we can stop walking.
        while futurelargelinkrevs:
            strippoint -= 1
            linkrev = heads.pop(strippoint)

            if linkrev < minlink:
                brokenrevs.add(strippoint)
            else:
                futurelargelinkrevs.remove(linkrev)

            for p in self.parentrevs(strippoint):
                if p != nullrev:
                    plinkrev = self.linkrev(p)
                    heads[p] = plinkrev
                    if plinkrev >= minlink:
                        futurelargelinkrevs.add(plinkrev)

        return strippoint, brokenrevs

    def strip(self, minlink, transaction):
        """truncate the revlog on the first revision with a linkrev >= minlink

        This function is called when we're stripping revision minlink and
        its descendants from the repository.

        We have to remove all revisions with linkrev >= minlink, because
        the equivalent changelog revisions will be renumbered after the
        strip.

        So we truncate the revlog on the first of these revisions, and
        trust that the caller has saved the revisions that shouldn't be
        removed and that it'll re-add them after this truncation.
        """
        if len(self) == 0:
            return

        rev, _ = self.getstrippoint(minlink)
        if rev == len(self):
            return

        # first truncate the files on disk
        end = self.start(rev)
        if not self._inline:
            transaction.add(self.datafile, end)
            end = rev * self._io.size
        else:
            end += rev * self._io.size

        transaction.add(self.indexfile, end)

        # then reset internal state in memory to forget those revisions
        self._cache = None
        self._chaininfocache = {}
        self._chunkclear()
        for x in pycompat.xrange(rev, len(self)):
            del self.nodemap[self.node(x)]

        del self.index[rev:-1]
        self._nodepos = None

    def checksize(self):
        expected = 0
        if len(self):
            expected = max(0, self.end(len(self) - 1))

        try:
            with self._datafp() as f:
                f.seek(0, 2)
                actual = f.tell()
            dd = actual - expected
        except IOError as inst:
            if inst.errno != errno.ENOENT:
                raise
            dd = 0

        try:
            f = self.opener(self.indexfile)
            f.seek(0, 2)
            actual = f.tell()
            f.close()
            s = self._io.size
            i = max(0, actual // s)
            di = actual - (i * s)
            if self._inline:
                databytes = 0
                for r in self:
                    databytes += max(0, self.length(r))
                dd = 0
                di = actual - len(self) * s - databytes
        except IOError as inst:
            if inst.errno != errno.ENOENT:
                raise
            di = 0

        return (dd, di)

    def files(self):
        res = [self.indexfile]
        if not self._inline:
            res.append(self.datafile)
        return res

    def emitrevisiondeltas(self, requests):
        frev = self.rev

        prevrev = None
        for request in requests:
            node = request.node
            rev = frev(node)

            if prevrev is None:
                prevrev = self.index[rev][5]

            # Requesting a full revision.
            if request.basenode == nullid:
                baserev = nullrev
            # Requesting an explicit revision.
            elif request.basenode is not None:
                baserev = frev(request.basenode)
            # Allowing us to choose.
            else:
                p1rev, p2rev = self.parentrevs(rev)
                deltaparentrev = self.deltaparent(rev)

                # Avoid sending full revisions when delta parent is null. Pick
                # prev in that case. It's tempting to pick p1 in this case, as
                # p1 will be smaller in the common case. However, computing a
                # delta against p1 may require resolving the raw text of p1,
                # which could be expensive. The revlog caches should have prev
                # cached, meaning less CPU for delta generation. There is
                # likely room to add a flag and/or config option to control this
                # behavior.
                if deltaparentrev == nullrev and self._storedeltachains:
                    baserev = prevrev

                # Revlog is configured to use full snapshot for a reason.
                # Stick to full snapshot.
                elif deltaparentrev == nullrev:
                    baserev = nullrev

                # Pick previous when we can't be sure the base is available
                # on consumer.
                elif deltaparentrev not in (p1rev, p2rev, prevrev):
                    baserev = prevrev
                else:
                    baserev = deltaparentrev

                if baserev != nullrev and not self.candelta(baserev, rev):
                    baserev = nullrev

            revision = None
            delta = None
            baserevisionsize = None

            if self.iscensored(baserev) or self.iscensored(rev):
                try:
                    revision = self.revision(node, raw=True)
                except error.CensoredNodeError as e:
                    revision = e.tombstone

                if baserev != nullrev:
                    baserevisionsize = self.rawsize(baserev)

            elif baserev == nullrev:
                revision = self.revision(node, raw=True)
            else:
                delta = self.revdiff(baserev, rev)

            extraflags = REVIDX_ELLIPSIS if request.ellipsis else 0

            yield revlogrevisiondelta(
                node=node,
                p1node=request.p1node,
                p2node=request.p2node,
                linknode=request.linknode,
                basenode=self.node(baserev),
                flags=self.flags(rev) | extraflags,
                baserevisionsize=baserevisionsize,
                revision=revision,
                delta=delta)

            prevrev = rev

    DELTAREUSEALWAYS = 'always'
    DELTAREUSESAMEREVS = 'samerevs'
    DELTAREUSENEVER = 'never'

    DELTAREUSEFULLADD = 'fulladd'

    DELTAREUSEALL = {'always', 'samerevs', 'never', 'fulladd'}

3065 def clone(self, tr, destrevlog, addrevisioncb=None,
2374 def clone(self, tr, destrevlog, addrevisioncb=None,
3066 deltareuse=DELTAREUSESAMEREVS, deltabothparents=None):
2375 deltareuse=DELTAREUSESAMEREVS, deltabothparents=None):
3067 """Copy this revlog to another, possibly with format changes.
2376 """Copy this revlog to another, possibly with format changes.
3068
2377
3069 The destination revlog will contain the same revisions and nodes.
2378 The destination revlog will contain the same revisions and nodes.
3070 However, it may not be bit-for-bit identical due to e.g. delta encoding
2379 However, it may not be bit-for-bit identical due to e.g. delta encoding
3071 differences.
2380 differences.
3072
2381
3073 The ``deltareuse`` argument control how deltas from the existing revlog
2382 The ``deltareuse`` argument control how deltas from the existing revlog
3074 are preserved in the destination revlog. The argument can have the
2383 are preserved in the destination revlog. The argument can have the
3075 following values:
2384 following values:
3076
2385
3077 DELTAREUSEALWAYS
2386 DELTAREUSEALWAYS
3078 Deltas will always be reused (if possible), even if the destination
2387 Deltas will always be reused (if possible), even if the destination
3079 revlog would not select the same revisions for the delta. This is the
2388 revlog would not select the same revisions for the delta. This is the
3080 fastest mode of operation.
2389 fastest mode of operation.
3081 DELTAREUSESAMEREVS
2390 DELTAREUSESAMEREVS
3082 Deltas will be reused if the destination revlog would pick the same
2391 Deltas will be reused if the destination revlog would pick the same
3083 revisions for the delta. This mode strikes a balance between speed
2392 revisions for the delta. This mode strikes a balance between speed
3084 and optimization.
2393 and optimization.
3085 DELTAREUSENEVER
2394 DELTAREUSENEVER
3086 Deltas will never be reused. This is the slowest mode of execution.
2395 Deltas will never be reused. This is the slowest mode of execution.
3087 This mode can be used to recompute deltas (e.g. if the diff/delta
2396 This mode can be used to recompute deltas (e.g. if the diff/delta
3088 algorithm changes).
2397 algorithm changes).
3089
2398
3090 Delta computation can be slow, so the choice of delta reuse policy can
2399 Delta computation can be slow, so the choice of delta reuse policy can
3091 significantly affect run time.
2400 significantly affect run time.
3092
2401
3093 The default policy (``DELTAREUSESAMEREVS``) strikes a balance between
2402 The default policy (``DELTAREUSESAMEREVS``) strikes a balance between
3094 two extremes. Deltas will be reused if they are appropriate. But if a
2403 two extremes. Deltas will be reused if they are appropriate. But if a
3095 better base revision could be chosen, it will be. This means if you
2404 better base revision could be chosen, it will be. This means if you
3096 are converting a non-generaldelta revlog to a generaldelta revlog,
2405 are converting a non-generaldelta revlog to a generaldelta revlog,
3097 deltas will be recomputed if the delta's parent isn't a parent of the
2406 deltas will be recomputed if the delta's parent isn't a parent of the
3098 revision.
2407 revision.
3099
2408
3100 In addition to the delta policy, the ``deltabothparents`` argument
2409 In addition to the delta policy, the ``deltabothparents`` argument
3101 controls whether to compute deltas against both parents for merges.
2410 controls whether to compute deltas against both parents for merges.
3102 If it is not set, the destination revlog's current setting is kept.
2411 If it is not set, the destination revlog's current setting is kept.
3103 """
2412 """
3104 if deltareuse not in self.DELTAREUSEALL:
2413 if deltareuse not in self.DELTAREUSEALL:
3105 raise ValueError(_('value for deltareuse invalid: %s') % deltareuse)
2414 raise ValueError(_('value for deltareuse invalid: %s') % deltareuse)
3106
2415
3107 if len(destrevlog):
2416 if len(destrevlog):
3108 raise ValueError(_('destination revlog is not empty'))
2417 raise ValueError(_('destination revlog is not empty'))
3109
2418
3110 if getattr(self, 'filteredrevs', None):
2419 if getattr(self, 'filteredrevs', None):
3111 raise ValueError(_('source revlog has filtered revisions'))
2420 raise ValueError(_('source revlog has filtered revisions'))
3112 if getattr(destrevlog, 'filteredrevs', None):
2421 if getattr(destrevlog, 'filteredrevs', None):
3113 raise ValueError(_('destination revlog has filtered revisions'))
2422 raise ValueError(_('destination revlog has filtered revisions'))
3114
2423
3115 # lazydeltabase controls whether to reuse a cached delta, if possible.
2424 # lazydeltabase controls whether to reuse a cached delta, if possible.
3116 oldlazydeltabase = destrevlog._lazydeltabase
2425 oldlazydeltabase = destrevlog._lazydeltabase
3117 oldamd = destrevlog._deltabothparents
2426 oldamd = destrevlog._deltabothparents
3118
2427
3119 try:
2428 try:
3120 if deltareuse == self.DELTAREUSEALWAYS:
2429 if deltareuse == self.DELTAREUSEALWAYS:
3121 destrevlog._lazydeltabase = True
2430 destrevlog._lazydeltabase = True
3122 elif deltareuse == self.DELTAREUSESAMEREVS:
2431 elif deltareuse == self.DELTAREUSESAMEREVS:
3123 destrevlog._lazydeltabase = False
2432 destrevlog._lazydeltabase = False
3124
2433
3125 destrevlog._deltabothparents = deltabothparents or oldamd
2434 destrevlog._deltabothparents = deltabothparents or oldamd
3126
2435
3127 populatecachedelta = deltareuse in (self.DELTAREUSEALWAYS,
2436 populatecachedelta = deltareuse in (self.DELTAREUSEALWAYS,
3128 self.DELTAREUSESAMEREVS)
2437 self.DELTAREUSESAMEREVS)
3129
2438
3130 deltacomputer = _deltacomputer(destrevlog)
2439 deltacomputer = deltautil.deltacomputer(destrevlog)
3131 index = self.index
2440 index = self.index
3132 for rev in self:
2441 for rev in self:
3133 entry = index[rev]
2442 entry = index[rev]
3134
2443
3135 # Some classes override linkrev to take filtered revs into
2444 # Some classes override linkrev to take filtered revs into
3136 # account. Use raw entry from index.
2445 # account. Use raw entry from index.
3137 flags = entry[0] & 0xffff
2446 flags = entry[0] & 0xffff
3138 linkrev = entry[4]
2447 linkrev = entry[4]
3139 p1 = index[entry[5]][7]
2448 p1 = index[entry[5]][7]
3140 p2 = index[entry[6]][7]
2449 p2 = index[entry[6]][7]
3141 node = entry[7]
2450 node = entry[7]
3142
2451
3143 # (Possibly) reuse the delta from the revlog if allowed and
2452 # (Possibly) reuse the delta from the revlog if allowed and
3144 # the revlog chunk is a delta.
2453 # the revlog chunk is a delta.
3145 cachedelta = None
2454 cachedelta = None
3146 rawtext = None
2455 rawtext = None
3147 if populatecachedelta:
2456 if populatecachedelta:
3148 dp = self.deltaparent(rev)
2457 dp = self.deltaparent(rev)
3149 if dp != nullrev:
2458 if dp != nullrev:
3150 cachedelta = (dp, bytes(self._chunk(rev)))
2459 cachedelta = (dp, bytes(self._chunk(rev)))
3151
2460
3152 if not cachedelta:
2461 if not cachedelta:
3153 rawtext = self.revision(rev, raw=True)
2462 rawtext = self.revision(rev, raw=True)
3154
2463
3155
2464
3156 if deltareuse == self.DELTAREUSEFULLADD:
2465 if deltareuse == self.DELTAREUSEFULLADD:
3157 destrevlog.addrevision(rawtext, tr, linkrev, p1, p2,
2466 destrevlog.addrevision(rawtext, tr, linkrev, p1, p2,
3158 cachedelta=cachedelta,
2467 cachedelta=cachedelta,
3159 node=node, flags=flags,
2468 node=node, flags=flags,
3160 deltacomputer=deltacomputer)
2469 deltacomputer=deltacomputer)
3161 else:
2470 else:
3162 ifh = destrevlog.opener(destrevlog.indexfile, 'a+',
2471 ifh = destrevlog.opener(destrevlog.indexfile, 'a+',
3163 checkambig=False)
2472 checkambig=False)
3164 dfh = None
2473 dfh = None
3165 if not destrevlog._inline:
2474 if not destrevlog._inline:
3166 dfh = destrevlog.opener(destrevlog.datafile, 'a+')
2475 dfh = destrevlog.opener(destrevlog.datafile, 'a+')
3167 try:
2476 try:
3168 destrevlog._addrevision(node, rawtext, tr, linkrev, p1,
2477 destrevlog._addrevision(node, rawtext, tr, linkrev, p1,
3169 p2, flags, cachedelta, ifh, dfh,
2478 p2, flags, cachedelta, ifh, dfh,
3170 deltacomputer=deltacomputer)
2479 deltacomputer=deltacomputer)
3171 finally:
2480 finally:
3172 if dfh:
2481 if dfh:
3173 dfh.close()
2482 dfh.close()
3174 ifh.close()
2483 ifh.close()
3175
2484
3176 if addrevisioncb:
2485 if addrevisioncb:
3177 addrevisioncb(self, rev, node)
2486 addrevisioncb(self, rev, node)
3178 finally:
2487 finally:
3179 destrevlog._lazydeltabase = oldlazydeltabase
2488 destrevlog._lazydeltabase = oldlazydeltabase
3180 destrevlog._deltabothparents = oldamd
2489 destrevlog._deltabothparents = oldamd
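To make the reuse policies above concrete, here is a minimal usage sketch (the `repo`, `srcrevlog`, and `destrevlog` names are hypothetical, not part of this change) that forces every delta to be recomputed during the copy:

    # hypothetical sketch: copy a revlog while recomputing every delta,
    # e.g. after a change in the delta selection algorithm
    with repo.transaction('recompute-deltas') as tr:
        srcrevlog.clone(tr, destrevlog,
                        deltareuse=srcrevlog.DELTAREUSENEVER,
                        deltabothparents=True)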
@@ -1,46 +1,43 b''
1 # revlogdeltas.py - constants used for revlog logic
1 # revlogdeltas.py - constants used for revlog logic
2 #
2 #
3 # Copyright 2005-2007 Matt Mackall <mpm@selenic.com>
3 # Copyright 2005-2007 Matt Mackall <mpm@selenic.com>
4 # Copyright 2018 Octobus <contact@octobus.net>
4 # Copyright 2018 Octobus <contact@octobus.net>
5 #
5 #
6 # This software may be used and distributed according to the terms of the
6 # This software may be used and distributed according to the terms of the
7 # GNU General Public License version 2 or any later version.
7 # GNU General Public License version 2 or any later version.
8 """Helper class to compute deltas stored inside revlogs"""
8 """Helper class to compute deltas stored inside revlogs"""
9
9
10 from __future__ import absolute_import
10 from __future__ import absolute_import
11
11
12 from .. import (
12 from .. import (
13 util,
13 util,
14 )
14 )
15
15
16 # revlog header flags
16 # revlog header flags
17 REVLOGV0 = 0
17 REVLOGV0 = 0
18 REVLOGV1 = 1
18 REVLOGV1 = 1
19 # Dummy value until file format is finalized.
19 # Dummy value until file format is finalized.
20 # Reminder: change the bounds check in revlog.__init__ when this is changed.
20 # Reminder: change the bounds check in revlog.__init__ when this is changed.
21 REVLOGV2 = 0xDEAD
21 REVLOGV2 = 0xDEAD
22 FLAG_INLINE_DATA = (1 << 16)
22 FLAG_INLINE_DATA = (1 << 16)
23 FLAG_GENERALDELTA = (1 << 17)
23 FLAG_GENERALDELTA = (1 << 17)
24 REVLOG_DEFAULT_FLAGS = FLAG_INLINE_DATA
24 REVLOG_DEFAULT_FLAGS = FLAG_INLINE_DATA
25 REVLOG_DEFAULT_FORMAT = REVLOGV1
25 REVLOG_DEFAULT_FORMAT = REVLOGV1
26 REVLOG_DEFAULT_VERSION = REVLOG_DEFAULT_FORMAT | REVLOG_DEFAULT_FLAGS
26 REVLOG_DEFAULT_VERSION = REVLOG_DEFAULT_FORMAT | REVLOG_DEFAULT_FLAGS
27 REVLOGV1_FLAGS = FLAG_INLINE_DATA | FLAG_GENERALDELTA
27 REVLOGV1_FLAGS = FLAG_INLINE_DATA | FLAG_GENERALDELTA
28 REVLOGV2_FLAGS = REVLOGV1_FLAGS
28 REVLOGV2_FLAGS = REVLOGV1_FLAGS
29
29
30 # revlog index flags
30 # revlog index flags
31 REVIDX_ISCENSORED = (1 << 15) # revision has censor metadata, must be verified
31 REVIDX_ISCENSORED = (1 << 15) # revision has censor metadata, must be verified
32 REVIDX_ELLIPSIS = (1 << 14) # revision hash does not match data (narrowhg)
32 REVIDX_ELLIPSIS = (1 << 14) # revision hash does not match data (narrowhg)
33 REVIDX_EXTSTORED = (1 << 13) # revision data is stored externally
33 REVIDX_EXTSTORED = (1 << 13) # revision data is stored externally
34 REVIDX_DEFAULT_FLAGS = 0
34 REVIDX_DEFAULT_FLAGS = 0
35 # stable order in which flags need to be processed and their processors applied
35 # stable order in which flags need to be processed and their processors applied
36 REVIDX_FLAGS_ORDER = [
36 REVIDX_FLAGS_ORDER = [
37 REVIDX_ISCENSORED,
37 REVIDX_ISCENSORED,
38 REVIDX_ELLIPSIS,
38 REVIDX_ELLIPSIS,
39 REVIDX_EXTSTORED,
39 REVIDX_EXTSTORED,
40 ]
40 ]
41 REVIDX_KNOWN_FLAGS = util.bitsfrom(REVIDX_FLAGS_ORDER)
41 REVIDX_KNOWN_FLAGS = util.bitsfrom(REVIDX_FLAGS_ORDER)
42 # bitmask for flags that could cause rawdata content change
42 # bitmask for flags that could cause rawdata content change
43 REVIDX_RAWTEXT_CHANGING_FLAGS = REVIDX_ISCENSORED | REVIDX_EXTSTORED
43 REVIDX_RAWTEXT_CHANGING_FLAGS = REVIDX_ISCENSORED | REVIDX_EXTSTORED
44
45 # maximum <delta-chain-data>/<revision-text-length> ratio
46 LIMIT_DELTA2TEXT = 2
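For orientation (a hand-checkable note, not part of the change): these flags are plain bitmasks, so `util.bitsfrom` simply ORs the listed flags together and the combined value follows directly:

    >>> (1 << 15) | (1 << 14) | (1 << 13)   # REVIDX_KNOWN_FLAGS
    57344
    >>> REVIDX_ISCENSORED | REVIDX_ELLIPSIS | REVIDX_EXTSTORED
    57344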
@@ -1,3180 +1,734 b''
1 # revlog.py - storage back-end for mercurial
1 # revlogdeltas.py - Logic around delta computation for revlog
2 #
2 #
3 # Copyright 2005-2007 Matt Mackall <mpm@selenic.com>
3 # Copyright 2005-2007 Matt Mackall <mpm@selenic.com>
4 # Copyright 2018 Octobus <contact@octobus.net>
4 #
5 #
5 # This software may be used and distributed according to the terms of the
6 # This software may be used and distributed according to the terms of the
6 # GNU General Public License version 2 or any later version.
7 # GNU General Public License version 2 or any later version.
7
8 """Helper class to compute deltas stored inside revlogs"""
8 """Storage back-end for Mercurial.
9
10 This provides efficient delta storage with O(1) retrieve and append
11 and O(changes) merge between branches.
12 """
13
9
14 from __future__ import absolute_import
10 from __future__ import absolute_import
15
11
16 import collections
17 import contextlib
18 import errno
19 import hashlib
20 import heapq
12 import heapq
21 import os
22 import re
23 import struct
13 import struct
24 import zlib
25
14
26 # import stuff from node for others to import from revlog
15 # import stuff from node for others to import from revlog
27 from .node import (
16 from ..node import (
28 bin,
29 hex,
30 nullhex,
31 nullid,
32 nullrev,
17 nullrev,
33 wdirfilenodeids,
34 wdirhex,
35 wdirid,
36 wdirrev,
37 )
18 )
38 from .i18n import _
19 from ..i18n import _
39 from .revlogutils.constants import (
20
40 FLAG_GENERALDELTA,
21 from .constants import (
41 FLAG_INLINE_DATA,
42 LIMIT_DELTA2TEXT,
43 REVIDX_DEFAULT_FLAGS,
44 REVIDX_ELLIPSIS,
45 REVIDX_EXTSTORED,
46 REVIDX_FLAGS_ORDER,
47 REVIDX_ISCENSORED,
22 REVIDX_ISCENSORED,
48 REVIDX_KNOWN_FLAGS,
49 REVIDX_RAWTEXT_CHANGING_FLAGS,
23 REVIDX_RAWTEXT_CHANGING_FLAGS,
50 REVLOGV0,
51 REVLOGV1,
52 REVLOGV1_FLAGS,
53 REVLOGV2,
54 REVLOGV2_FLAGS,
55 REVLOG_DEFAULT_FLAGS,
56 REVLOG_DEFAULT_FORMAT,
57 REVLOG_DEFAULT_VERSION,
58 )
24 )
59 from .thirdparty import (
25
26 from ..thirdparty import (
60 attr,
27 attr,
61 )
28 )
62 from . import (
29
63 ancestor,
30 from .. import (
64 error,
31 error,
65 mdiff,
32 mdiff,
66 policy,
67 pycompat,
68 repository,
69 templatefilters,
70 util,
71 )
33 )
72 from .utils import (
73 interfaceutil,
74 stringutil,
75 )
76
77 # blanked usage of all the names to prevent pyflakes complaints
78 # We need these names available in the module for extensions.
79 REVLOGV0
80 REVLOGV1
81 REVLOGV2
82 FLAG_INLINE_DATA
83 FLAG_GENERALDELTA
84 REVLOG_DEFAULT_FLAGS
85 REVLOG_DEFAULT_FORMAT
86 REVLOG_DEFAULT_VERSION
87 REVLOGV1_FLAGS
88 REVLOGV2_FLAGS
89 REVIDX_ISCENSORED
90 REVIDX_ELLIPSIS
91 REVIDX_EXTSTORED
92 REVIDX_DEFAULT_FLAGS
93 REVIDX_FLAGS_ORDER
94 REVIDX_KNOWN_FLAGS
95 REVIDX_RAWTEXT_CHANGING_FLAGS
96
97 parsers = policy.importmod(r'parsers')
98
99 # Aliased for performance.
100 _zlibdecompress = zlib.decompress
101
102 # max size of revlog with inline data
103 _maxinline = 131072
104 _chunksize = 1048576
105
34
106 RevlogError = error.RevlogError
35 RevlogError = error.RevlogError
107 LookupError = error.LookupError
108 AmbiguousPrefixLookupError = error.AmbiguousPrefixLookupError
109 CensoredNodeError = error.CensoredNodeError
36 CensoredNodeError = error.CensoredNodeError
110 ProgrammingError = error.ProgrammingError
111
112 # Store flag processors (cf. 'addflagprocessor()' to register)
113 _flagprocessors = {
114 REVIDX_ISCENSORED: None,
115 }
116
117 _mdre = re.compile('\1\n')
118 def parsemeta(text):
119 """return (metadatadict, metadatasize)"""
120 # text can be buffer, so we can't use .startswith or .index
121 if text[:2] != '\1\n':
122 return None, None
123 s = _mdre.search(text, 2).start()
124 mtext = text[2:s]
125 meta = {}
126 for l in mtext.splitlines():
127 k, v = l.split(": ", 1)
128 meta[k] = v
129 return meta, (s + 2)
130
131 def packmeta(meta, text):
132 keys = sorted(meta)
133 metatext = "".join("%s: %s\n" % (k, meta[k]) for k in keys)
134 return "\1\n%s\1\n%s" % (metatext, text)
135
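These two helpers are inverses over the "\x01\n" metadata envelope; a quick round-trip check (doctest style, matching the examples used elsewhere in this file):

    >>> packmeta({'copy': 'a'}, 'text')
    '\x01\ncopy: a\n\x01\ntext'
    >>> parsemeta(packmeta({'copy': 'a'}, 'text'))
    ({'copy': 'a'}, 12)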
136 def _censoredtext(text):
137 m, offs = parsemeta(text)
138 return m and "censored" in m
139
140 def addflagprocessor(flag, processor):
141 """Register a flag processor on a revision data flag.
142
37
143 Invariant:
38 # maximum <delta-chain-data>/<revision-text-length> ratio
144 - Flags need to be defined in REVIDX_KNOWN_FLAGS and REVIDX_FLAGS_ORDER,
39 LIMIT_DELTA2TEXT = 2
145 and REVIDX_RAWTEXT_CHANGING_FLAGS if they can alter rawtext.
146 - Only one flag processor can be registered on a specific flag.
147 - flagprocessors must be 3-tuples of functions (read, write, raw) with the
148 following signatures:
149 - (read) f(self, rawtext) -> text, bool
150 - (write) f(self, text) -> rawtext, bool
151 - (raw) f(self, rawtext) -> bool
152 "text" is presented to the user. "rawtext" is stored in revlog data, not
153 directly visible to the user.
154 The boolean returned by these transforms is used to determine whether
155 the returned text can be used for hash integrity checking. For example,
156 if "write" returns False, then "text" is used to generate hash. If
157 "write" returns True, that basically means "rawtext" returned by "write"
158 should be used to generate hash. Usually, "write" and "read" return
159 different booleans. And "raw" returns a same boolean as "write".
160
161 Note: The 'raw' transform is used for changegroup generation and in some
162 debug commands. In this case the transform only indicates whether the
163 contents can be used for hash integrity checks.
164 """
165 if not flag & REVIDX_KNOWN_FLAGS:
166 msg = _("cannot register processor on unknown flag '%#x'.") % (flag)
167 raise ProgrammingError(msg)
168 if flag not in REVIDX_FLAGS_ORDER:
169 msg = _("flag '%#x' undefined in REVIDX_FLAGS_ORDER.") % (flag)
170 raise ProgrammingError(msg)
171 if flag in _flagprocessors:
172 msg = _("cannot register multiple processors on flag '%#x'.") % (flag)
173 raise error.Abort(msg)
174 _flagprocessors[flag] = processor
175
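A registration sketch following the contract documented above (the identity processors here are hypothetical, not a real extension):

    # hypothetical identity processors showing the (read, write, raw) shape
    def _read(rl, rawtext):
        return rawtext, True    # text equals rawtext, usable for hashing
    def _write(rl, text):
        return text, True
    def _raw(rl, rawtext):
        return True             # same boolean as _write, per the docstring
    addflagprocessor(REVIDX_EXTSTORED, (_read, _write, _raw))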
176 def getoffset(q):
177 return int(q >> 16)
178
179 def gettype(q):
180 return int(q & 0xFFFF)
181
182 def offset_type(offset, type):
183 if (type & ~REVIDX_KNOWN_FLAGS) != 0:
184 raise ValueError('unknown revlog index flags')
185 return int(int(offset) << 16 | type)
186
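These helpers pack a byte offset and the 16 flag bits into a single integer; a quick worked check:

    >>> q = offset_type(3, REVIDX_ISCENSORED)   # (3 << 16) | 0x8000
    >>> getoffset(q), gettype(q) == REVIDX_ISCENSORED
    (3, True)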
187 _nullhash = hashlib.sha1(nullid)
188
189 def hash(text, p1, p2):
190 """generate a hash from the given text and its parent hashes
191
192 This hash combines both the current file contents and its history
193 in a manner that makes it easy to distinguish nodes with the same
194 content in the revision graph.
195 """
196 # As of now, if one of the parent node is null, p2 is null
197 if p2 == nullid:
198 # deep copy of a hash is faster than creating one
199 s = _nullhash.copy()
200 s.update(p1)
201 else:
202 # none of the parent nodes are nullid
203 if p1 < p2:
204 a = p1
205 b = p2
206 else:
207 a = p2
208 b = p1
209 s = hashlib.sha1(a)
210 s.update(b)
211 s.update(text)
212 return s.digest()
213
40
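One property of this hashing worth noting: because the two non-null parents are sorted before being fed to SHA-1, hash(text, p1, p2) == hash(text, p2, p1), so a node id never depends on parent order.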
214 class _testrevlog(object):
41 class _testrevlog(object):
215 """minimalist fake revlog to use in doctests"""
42 """minimalist fake revlog to use in doctests"""
216
43
217 def __init__(self, data, density=0.5, mingap=0):
44 def __init__(self, data, density=0.5, mingap=0):
218 """data is an list of revision payload boundaries"""
45 """data is an list of revision payload boundaries"""
219 self._data = data
46 self._data = data
220 self._srdensitythreshold = density
47 self._srdensitythreshold = density
221 self._srmingapsize = mingap
48 self._srmingapsize = mingap
222
49
223 def start(self, rev):
50 def start(self, rev):
224 if rev == 0:
51 if rev == 0:
225 return 0
52 return 0
226 return self._data[rev - 1]
53 return self._data[rev - 1]
227
54
228 def end(self, rev):
55 def end(self, rev):
229 return self._data[rev]
56 return self._data[rev]
230
57
231 def length(self, rev):
58 def length(self, rev):
232 return self.end(rev) - self.start(rev)
59 return self.end(rev) - self.start(rev)
233
60
234 def __len__(self):
61 def __len__(self):
235 return len(self._data)
62 return len(self._data)
236
63
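The boundary encoding is easiest to see with a tiny example (same doctest style as below):

    >>> rl = _testrevlog([5, 10, 12])
    >>> rl.start(1), rl.end(1), rl.length(1)
    (5, 10, 5)
    >>> rl.length(2)   # rev 2 occupies bytes 10..12
    2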
237 def _trimchunk(revlog, revs, startidx, endidx=None):
64 def slicechunk(revlog, revs, deltainfo=None, targetsize=None):
238 """returns revs[startidx:endidx] without empty trailing revs
239
240 Doctest Setup
241 >>> revlog = _testrevlog([
242 ... 5, #0
243 ... 10, #1
244 ... 12, #2
245 ... 12, #3 (empty)
246 ... 17, #4
247 ... 21, #5
248 ... 21, #6 (empty)
249 ... ])
250
251 Contiguous cases:
252 >>> _trimchunk(revlog, [0, 1, 2, 3, 4, 5, 6], 0)
253 [0, 1, 2, 3, 4, 5]
254 >>> _trimchunk(revlog, [0, 1, 2, 3, 4, 5, 6], 0, 5)
255 [0, 1, 2, 3, 4]
256 >>> _trimchunk(revlog, [0, 1, 2, 3, 4, 5, 6], 0, 4)
257 [0, 1, 2]
258 >>> _trimchunk(revlog, [0, 1, 2, 3, 4, 5, 6], 2, 4)
259 [2]
260 >>> _trimchunk(revlog, [0, 1, 2, 3, 4, 5, 6], 3)
261 [3, 4, 5]
262 >>> _trimchunk(revlog, [0, 1, 2, 3, 4, 5, 6], 3, 5)
263 [3, 4]
264
265 Discontiguous cases:
266 >>> _trimchunk(revlog, [1, 3, 5, 6], 0)
267 [1, 3, 5]
268 >>> _trimchunk(revlog, [1, 3, 5, 6], 0, 2)
269 [1]
270 >>> _trimchunk(revlog, [1, 3, 5, 6], 1, 3)
271 [3, 5]
272 >>> _trimchunk(revlog, [1, 3, 5, 6], 1)
273 [3, 5]
274 """
275 length = revlog.length
276
277 if endidx is None:
278 endidx = len(revs)
279
280 # If we have a non-empty delta candidate, there is nothing to trim
281 if revs[endidx - 1] < len(revlog):
282 # Trim empty revs at the end, except the very first revision of a chain
283 while (endidx > 1
284 and endidx > startidx
285 and length(revs[endidx - 1]) == 0):
286 endidx -= 1
287
288 return revs[startidx:endidx]
289
290 def _segmentspan(revlog, revs, deltainfo=None):
291 """Get the byte span of a segment of revisions
292
293 revs is a sorted array of revision numbers
294
295 >>> revlog = _testrevlog([
296 ... 5, #0
297 ... 10, #1
298 ... 12, #2
299 ... 12, #3 (empty)
300 ... 17, #4
301 ... ])
302
303 >>> _segmentspan(revlog, [0, 1, 2, 3, 4])
304 17
305 >>> _segmentspan(revlog, [0, 4])
306 17
307 >>> _segmentspan(revlog, [3, 4])
308 5
309 >>> _segmentspan(revlog, [1, 2, 3,])
310 7
311 >>> _segmentspan(revlog, [1, 3])
312 7
313 """
314 if not revs:
315 return 0
316 if deltainfo is not None and len(revlog) <= revs[-1]:
317 if len(revs) == 1:
318 return deltainfo.deltalen
319 offset = revlog.end(len(revlog) - 1)
320 end = deltainfo.deltalen + offset
321 else:
322 end = revlog.end(revs[-1])
323 return end - revlog.start(revs[0])
324
325 def _slicechunk(revlog, revs, deltainfo=None, targetsize=None):
326 """slice revs to reduce the amount of unrelated data to be read from disk.
65 """slice revs to reduce the amount of unrelated data to be read from disk.
327
66
328 ``revs`` is sliced into groups that should be read in one time.
67 ``revs`` is sliced into groups that should be read in one time.
329 Assume that revs are sorted.
68 Assume that revs are sorted.
330
69
331 The initial chunk is sliced until the overall density (payload/chunks-span
70 The initial chunk is sliced until the overall density (payload/chunks-span
332 ratio) is above `revlog._srdensitythreshold`. No gap smaller than
71 ratio) is above `revlog._srdensitythreshold`. No gap smaller than
333 `revlog._srmingapsize` is skipped.
72 `revlog._srmingapsize` is skipped.
334
73
335 If `targetsize` is set, no chunk larger than `targetsize` will be yielded.
74 If `targetsize` is set, no chunk larger than `targetsize` will be yielded.
336 For consistency with other slicing choices, this limit won't go lower than
75 For consistency with other slicing choices, this limit won't go lower than
337 `revlog._srmingapsize`.
76 `revlog._srmingapsize`.
338
77
339 If individual revision chunks are larger than this limit, they will still
78 If individual revision chunks are larger than this limit, they will still
340 be yielded individually.
79 be yielded individually.
341
80
342 >>> revlog = _testrevlog([
81 >>> revlog = _testrevlog([
343 ... 5, #00 (5)
82 ... 5, #00 (5)
344 ... 10, #01 (5)
83 ... 10, #01 (5)
345 ... 12, #02 (2)
84 ... 12, #02 (2)
346 ... 12, #03 (empty)
85 ... 12, #03 (empty)
347 ... 27, #04 (15)
86 ... 27, #04 (15)
348 ... 31, #05 (4)
87 ... 31, #05 (4)
349 ... 31, #06 (empty)
88 ... 31, #06 (empty)
350 ... 42, #07 (11)
89 ... 42, #07 (11)
351 ... 47, #08 (5)
90 ... 47, #08 (5)
352 ... 47, #09 (empty)
91 ... 47, #09 (empty)
353 ... 48, #10 (1)
92 ... 48, #10 (1)
354 ... 51, #11 (3)
93 ... 51, #11 (3)
355 ... 74, #12 (23)
94 ... 74, #12 (23)
356 ... 85, #13 (11)
95 ... 85, #13 (11)
357 ... 86, #14 (1)
96 ... 86, #14 (1)
358 ... 91, #15 (5)
97 ... 91, #15 (5)
359 ... ])
98 ... ])
360
99
361 >>> list(_slicechunk(revlog, list(range(16))))
100 >>> list(slicechunk(revlog, list(range(16))))
362 [[0, 1, 2, 3, 4, 5, 6, 7, 8, 9, 10, 11, 12, 13, 14, 15]]
101 [[0, 1, 2, 3, 4, 5, 6, 7, 8, 9, 10, 11, 12, 13, 14, 15]]
363 >>> list(_slicechunk(revlog, [0, 15]))
102 >>> list(slicechunk(revlog, [0, 15]))
364 [[0], [15]]
103 [[0], [15]]
365 >>> list(_slicechunk(revlog, [0, 11, 15]))
104 >>> list(slicechunk(revlog, [0, 11, 15]))
366 [[0], [11], [15]]
105 [[0], [11], [15]]
367 >>> list(_slicechunk(revlog, [0, 11, 13, 15]))
106 >>> list(slicechunk(revlog, [0, 11, 13, 15]))
368 [[0], [11, 13, 15]]
107 [[0], [11, 13, 15]]
369 >>> list(_slicechunk(revlog, [1, 2, 3, 5, 8, 10, 11, 14]))
108 >>> list(slicechunk(revlog, [1, 2, 3, 5, 8, 10, 11, 14]))
370 [[1, 2], [5, 8, 10, 11], [14]]
109 [[1, 2], [5, 8, 10, 11], [14]]
371
110
372 Slicing with a maximum chunk size
111 Slicing with a maximum chunk size
373 >>> list(_slicechunk(revlog, [0, 11, 13, 15], targetsize=15))
112 >>> list(slicechunk(revlog, [0, 11, 13, 15], targetsize=15))
374 [[0], [11], [13], [15]]
113 [[0], [11], [13], [15]]
375 >>> list(_slicechunk(revlog, [0, 11, 13, 15], targetsize=20))
114 >>> list(slicechunk(revlog, [0, 11, 13, 15], targetsize=20))
376 [[0], [11], [13, 15]]
115 [[0], [11], [13, 15]]
377 """
116 """
378 if targetsize is not None:
117 if targetsize is not None:
379 targetsize = max(targetsize, revlog._srmingapsize)
118 targetsize = max(targetsize, revlog._srmingapsize)
380 # targetsize should not be specified when evaluating delta candidates:
119 # targetsize should not be specified when evaluating delta candidates:
381 # * targetsize is used to ensure we stay within specification when reading,
120 # * targetsize is used to ensure we stay within specification when reading,
382 # * deltainfo is used to pick a good delta chain when writing.
121 # * deltainfo is used to pick a good delta chain when writing.
383 if not (deltainfo is None or targetsize is None):
122 if not (deltainfo is None or targetsize is None):
384 msg = 'cannot use `targetsize` with a `deltainfo`'
123 msg = 'cannot use `targetsize` with a `deltainfo`'
385 raise error.ProgrammingError(msg)
124 raise error.ProgrammingError(msg)
386 for chunk in _slicechunktodensity(revlog, revs,
125 for chunk in _slicechunktodensity(revlog, revs,
387 deltainfo,
126 deltainfo,
388 revlog._srdensitythreshold,
127 revlog._srdensitythreshold,
389 revlog._srmingapsize):
128 revlog._srmingapsize):
390 for subchunk in _slicechunktosize(revlog, chunk, targetsize):
129 for subchunk in _slicechunktosize(revlog, chunk, targetsize):
391 yield subchunk
130 yield subchunk
392
131
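To make the density criterion concrete, working through the [0, 11, 13, 15] doctest above: reading those revisions as one chunk would span bytes 0..91 for a payload of 5 + 3 + 11 + 5 = 24, a density of roughly 0.26. Dropping the single largest gap (the 43 unread bytes between revs 0 and 11) raises the estimated density to 24 / (91 - 43) = 0.5, which meets the default threshold, hence the result [[0], [11, 13, 15]].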
393 def _slicechunktosize(revlog, revs, targetsize=None):
132 def _slicechunktosize(revlog, revs, targetsize=None):
394 """slice revs to match the target size
133 """slice revs to match the target size
395
134
396 This is intended to be used on chunks that density slicing selected, but
135 This is intended to be used on chunks that density slicing selected, but
397 that are still too large compared to the read guarantee of revlog. This
136 that are still too large compared to the read guarantee of revlog. This
398 might happen when "minimal gap size" interrupted the slicing or when
137 might happen when "minimal gap size" interrupted the slicing or when
399 chains are built in a way that creates large blocks next to each other.
138 chains are built in a way that creates large blocks next to each other.
400
139
401 >>> revlog = _testrevlog([
140 >>> revlog = _testrevlog([
402 ... 3, #0 (3)
141 ... 3, #0 (3)
403 ... 5, #1 (2)
142 ... 5, #1 (2)
404 ... 6, #2 (1)
143 ... 6, #2 (1)
405 ... 8, #3 (2)
144 ... 8, #3 (2)
406 ... 8, #4 (empty)
145 ... 8, #4 (empty)
407 ... 11, #5 (3)
146 ... 11, #5 (3)
408 ... 12, #6 (1)
147 ... 12, #6 (1)
409 ... 13, #7 (1)
148 ... 13, #7 (1)
410 ... 14, #8 (1)
149 ... 14, #8 (1)
411 ... ])
150 ... ])
412
151
413 Cases where chunk is already small enough
152 Cases where chunk is already small enough
414 >>> list(_slicechunktosize(revlog, [0], 3))
153 >>> list(_slicechunktosize(revlog, [0], 3))
415 [[0]]
154 [[0]]
416 >>> list(_slicechunktosize(revlog, [6, 7], 3))
155 >>> list(_slicechunktosize(revlog, [6, 7], 3))
417 [[6, 7]]
156 [[6, 7]]
418 >>> list(_slicechunktosize(revlog, [0], None))
157 >>> list(_slicechunktosize(revlog, [0], None))
419 [[0]]
158 [[0]]
420 >>> list(_slicechunktosize(revlog, [6, 7], None))
159 >>> list(_slicechunktosize(revlog, [6, 7], None))
421 [[6, 7]]
160 [[6, 7]]
422
161
423 cases where we need actual slicing
162 cases where we need actual slicing
424 >>> list(_slicechunktosize(revlog, [0, 1], 3))
163 >>> list(_slicechunktosize(revlog, [0, 1], 3))
425 [[0], [1]]
164 [[0], [1]]
426 >>> list(_slicechunktosize(revlog, [1, 3], 3))
165 >>> list(_slicechunktosize(revlog, [1, 3], 3))
427 [[1], [3]]
166 [[1], [3]]
428 >>> list(_slicechunktosize(revlog, [1, 2, 3], 3))
167 >>> list(_slicechunktosize(revlog, [1, 2, 3], 3))
429 [[1, 2], [3]]
168 [[1, 2], [3]]
430 >>> list(_slicechunktosize(revlog, [3, 5], 3))
169 >>> list(_slicechunktosize(revlog, [3, 5], 3))
431 [[3], [5]]
170 [[3], [5]]
432 >>> list(_slicechunktosize(revlog, [3, 4, 5], 3))
171 >>> list(_slicechunktosize(revlog, [3, 4, 5], 3))
433 [[3], [5]]
172 [[3], [5]]
434 >>> list(_slicechunktosize(revlog, [5, 6, 7, 8], 3))
173 >>> list(_slicechunktosize(revlog, [5, 6, 7, 8], 3))
435 [[5], [6, 7, 8]]
174 [[5], [6, 7, 8]]
436 >>> list(_slicechunktosize(revlog, [0, 1, 2, 3, 4, 5, 6, 7, 8], 3))
175 >>> list(_slicechunktosize(revlog, [0, 1, 2, 3, 4, 5, 6, 7, 8], 3))
437 [[0], [1, 2], [3], [5], [6, 7, 8]]
176 [[0], [1, 2], [3], [5], [6, 7, 8]]
438
177
439 Case with too large individual chunk (must return valid chunk)
178 Case with too large individual chunk (must return valid chunk)
440 >>> list(_slicechunktosize(revlog, [0, 1], 2))
179 >>> list(_slicechunktosize(revlog, [0, 1], 2))
441 [[0], [1]]
180 [[0], [1]]
442 >>> list(_slicechunktosize(revlog, [1, 3], 1))
181 >>> list(_slicechunktosize(revlog, [1, 3], 1))
443 [[1], [3]]
182 [[1], [3]]
444 >>> list(_slicechunktosize(revlog, [3, 4, 5], 2))
183 >>> list(_slicechunktosize(revlog, [3, 4, 5], 2))
445 [[3], [5]]
184 [[3], [5]]
446 """
185 """
447 assert targetsize is None or 0 <= targetsize
186 assert targetsize is None or 0 <= targetsize
448 if targetsize is None or _segmentspan(revlog, revs) <= targetsize:
187 if targetsize is None or segmentspan(revlog, revs) <= targetsize:
449 yield revs
188 yield revs
450 return
189 return
451
190
452 startrevidx = 0
191 startrevidx = 0
453 startdata = revlog.start(revs[0])
192 startdata = revlog.start(revs[0])
454 endrevidx = 0
193 endrevidx = 0
455 iterrevs = enumerate(revs)
194 iterrevs = enumerate(revs)
456 next(iterrevs) # skip first rev.
195 next(iterrevs) # skip first rev.
457 for idx, r in iterrevs:
196 for idx, r in iterrevs:
458 span = revlog.end(r) - startdata
197 span = revlog.end(r) - startdata
459 if span <= targetsize:
198 if span <= targetsize:
460 endrevidx = idx
199 endrevidx = idx
461 else:
200 else:
462 chunk = _trimchunk(revlog, revs, startrevidx, endrevidx + 1)
201 chunk = _trimchunk(revlog, revs, startrevidx, endrevidx + 1)
463 if chunk:
202 if chunk:
464 yield chunk
203 yield chunk
465 startrevidx = idx
204 startrevidx = idx
466 startdata = revlog.start(r)
205 startdata = revlog.start(r)
467 endrevidx = idx
206 endrevidx = idx
468 yield _trimchunk(revlog, revs, startrevidx)
207 yield _trimchunk(revlog, revs, startrevidx)
469
208
470 def _slicechunktodensity(revlog, revs, deltainfo=None, targetdensity=0.5,
209 def _slicechunktodensity(revlog, revs, deltainfo=None, targetdensity=0.5,
471 mingapsize=0):
210 mingapsize=0):
472 """slice revs to reduce the amount of unrelated data to be read from disk.
211 """slice revs to reduce the amount of unrelated data to be read from disk.
473
212
474 ``revs`` is sliced into groups that should be read in one time.
213 ``revs`` is sliced into groups that should be read in one time.
475 Assume that revs are sorted.
214 Assume that revs are sorted.
476
215
477 ``deltainfo`` is a _deltainfo instance of a revision that we would append
216 ``deltainfo`` is a _deltainfo instance of a revision that we would append
478 to the top of the revlog.
217 to the top of the revlog.
479
218
480 The initial chunk is sliced until the overall density (payload/chunks-span
219 The initial chunk is sliced until the overall density (payload/chunks-span
481 ratio) is above `targetdensity`. No gap smaller than `mingapsize` is
220 ratio) is above `targetdensity`. No gap smaller than `mingapsize` is
482 skipped.
221 skipped.
483
222
484 >>> revlog = _testrevlog([
223 >>> revlog = _testrevlog([
485 ... 5, #00 (5)
224 ... 5, #00 (5)
486 ... 10, #01 (5)
225 ... 10, #01 (5)
487 ... 12, #02 (2)
226 ... 12, #02 (2)
488 ... 12, #03 (empty)
227 ... 12, #03 (empty)
489 ... 27, #04 (15)
228 ... 27, #04 (15)
490 ... 31, #05 (4)
229 ... 31, #05 (4)
491 ... 31, #06 (empty)
230 ... 31, #06 (empty)
492 ... 42, #07 (11)
231 ... 42, #07 (11)
493 ... 47, #08 (5)
232 ... 47, #08 (5)
494 ... 47, #09 (empty)
233 ... 47, #09 (empty)
495 ... 48, #10 (1)
234 ... 48, #10 (1)
496 ... 51, #11 (3)
235 ... 51, #11 (3)
497 ... 74, #12 (23)
236 ... 74, #12 (23)
498 ... 85, #13 (11)
237 ... 85, #13 (11)
499 ... 86, #14 (1)
238 ... 86, #14 (1)
500 ... 91, #15 (5)
239 ... 91, #15 (5)
501 ... ])
240 ... ])
502
241
503 >>> list(_slicechunktodensity(revlog, list(range(16))))
242 >>> list(_slicechunktodensity(revlog, list(range(16))))
504 [[0, 1, 2, 3, 4, 5, 6, 7, 8, 9, 10, 11, 12, 13, 14, 15]]
243 [[0, 1, 2, 3, 4, 5, 6, 7, 8, 9, 10, 11, 12, 13, 14, 15]]
505 >>> list(_slicechunktodensity(revlog, [0, 15]))
244 >>> list(_slicechunktodensity(revlog, [0, 15]))
506 [[0], [15]]
245 [[0], [15]]
507 >>> list(_slicechunktodensity(revlog, [0, 11, 15]))
246 >>> list(_slicechunktodensity(revlog, [0, 11, 15]))
508 [[0], [11], [15]]
247 [[0], [11], [15]]
509 >>> list(_slicechunktodensity(revlog, [0, 11, 13, 15]))
248 >>> list(_slicechunktodensity(revlog, [0, 11, 13, 15]))
510 [[0], [11, 13, 15]]
249 [[0], [11, 13, 15]]
511 >>> list(_slicechunktodensity(revlog, [1, 2, 3, 5, 8, 10, 11, 14]))
250 >>> list(_slicechunktodensity(revlog, [1, 2, 3, 5, 8, 10, 11, 14]))
512 [[1, 2], [5, 8, 10, 11], [14]]
251 [[1, 2], [5, 8, 10, 11], [14]]
513 >>> list(_slicechunktodensity(revlog, [1, 2, 3, 5, 8, 10, 11, 14],
252 >>> list(_slicechunktodensity(revlog, [1, 2, 3, 5, 8, 10, 11, 14],
514 ... mingapsize=20))
253 ... mingapsize=20))
515 [[1, 2, 3, 5, 8, 10, 11], [14]]
254 [[1, 2, 3, 5, 8, 10, 11], [14]]
516 >>> list(_slicechunktodensity(revlog, [1, 2, 3, 5, 8, 10, 11, 14],
255 >>> list(_slicechunktodensity(revlog, [1, 2, 3, 5, 8, 10, 11, 14],
517 ... targetdensity=0.95))
256 ... targetdensity=0.95))
518 [[1, 2], [5], [8, 10, 11], [14]]
257 [[1, 2], [5], [8, 10, 11], [14]]
519 >>> list(_slicechunktodensity(revlog, [1, 2, 3, 5, 8, 10, 11, 14],
258 >>> list(_slicechunktodensity(revlog, [1, 2, 3, 5, 8, 10, 11, 14],
520 ... targetdensity=0.95, mingapsize=12))
259 ... targetdensity=0.95, mingapsize=12))
521 [[1, 2], [5, 8, 10, 11], [14]]
260 [[1, 2], [5, 8, 10, 11], [14]]
522 """
261 """
523 start = revlog.start
262 start = revlog.start
524 length = revlog.length
263 length = revlog.length
525
264
526 if len(revs) <= 1:
265 if len(revs) <= 1:
527 yield revs
266 yield revs
528 return
267 return
529
268
530 nextrev = len(revlog)
269 nextrev = len(revlog)
531 nextoffset = revlog.end(nextrev - 1)
270 nextoffset = revlog.end(nextrev - 1)
532
271
533 if deltainfo is None:
272 if deltainfo is None:
534 deltachainspan = _segmentspan(revlog, revs)
273 deltachainspan = segmentspan(revlog, revs)
535 chainpayload = sum(length(r) for r in revs)
274 chainpayload = sum(length(r) for r in revs)
536 else:
275 else:
537 deltachainspan = deltainfo.distance
276 deltachainspan = deltainfo.distance
538 chainpayload = deltainfo.compresseddeltalen
277 chainpayload = deltainfo.compresseddeltalen
539
278
540 if deltachainspan < mingapsize:
279 if deltachainspan < mingapsize:
541 yield revs
280 yield revs
542 return
281 return
543
282
544 readdata = deltachainspan
283 readdata = deltachainspan
545
284
546 if deltachainspan:
285 if deltachainspan:
547 density = chainpayload / float(deltachainspan)
286 density = chainpayload / float(deltachainspan)
548 else:
287 else:
549 density = 1.0
288 density = 1.0
550
289
551 if density >= targetdensity:
290 if density >= targetdensity:
552 yield revs
291 yield revs
553 return
292 return
554
293
555 if deltainfo is not None and deltainfo.deltalen:
294 if deltainfo is not None and deltainfo.deltalen:
556 revs = list(revs)
295 revs = list(revs)
557 revs.append(nextrev)
296 revs.append(nextrev)
558
297
559 # Store the gaps in a heap to have them sorted by decreasing size
298 # Store the gaps in a heap to have them sorted by decreasing size
560 gapsheap = []
299 gapsheap = []
561 heapq.heapify(gapsheap)
300 heapq.heapify(gapsheap)
562 prevend = None
301 prevend = None
563 for i, rev in enumerate(revs):
302 for i, rev in enumerate(revs):
564 if rev < nextrev:
303 if rev < nextrev:
565 revstart = start(rev)
304 revstart = start(rev)
566 revlen = length(rev)
305 revlen = length(rev)
567 else:
306 else:
568 revstart = nextoffset
307 revstart = nextoffset
569 revlen = deltainfo.deltalen
308 revlen = deltainfo.deltalen
570
309
571 # Skip empty revisions to form larger holes
310 # Skip empty revisions to form larger holes
572 if revlen == 0:
311 if revlen == 0:
573 continue
312 continue
574
313
575 if prevend is not None:
314 if prevend is not None:
576 gapsize = revstart - prevend
315 gapsize = revstart - prevend
577 # only consider holes that are large enough
316 # only consider holes that are large enough
578 if gapsize > mingapsize:
317 if gapsize > mingapsize:
579 heapq.heappush(gapsheap, (-gapsize, i))
318 heapq.heappush(gapsheap, (-gapsize, i))
580
319
581 prevend = revstart + revlen
320 prevend = revstart + revlen
582
321
583 # Collect the indices of the largest holes until the density is acceptable
322 # Collect the indices of the largest holes until the density is acceptable
584 indicesheap = []
323 indicesheap = []
585 heapq.heapify(indicesheap)
324 heapq.heapify(indicesheap)
586 while gapsheap and density < targetdensity:
325 while gapsheap and density < targetdensity:
587 oppgapsize, gapidx = heapq.heappop(gapsheap)
326 oppgapsize, gapidx = heapq.heappop(gapsheap)
588
327
589 heapq.heappush(indicesheap, gapidx)
328 heapq.heappush(indicesheap, gapidx)
590
329
591 # the gap sizes are stored as negatives to be sorted decreasingly
330 # the gap sizes are stored as negatives to be sorted decreasingly
592 # by the heap
331 # by the heap
593 readdata -= (-oppgapsize)
332 readdata -= (-oppgapsize)
594 if readdata > 0:
333 if readdata > 0:
595 density = chainpayload / float(readdata)
334 density = chainpayload / float(readdata)
596 else:
335 else:
597 density = 1.0
336 density = 1.0
598
337
599 # Cut the revs at collected indices
338 # Cut the revs at collected indices
600 previdx = 0
339 previdx = 0
601 while indicesheap:
340 while indicesheap:
602 idx = heapq.heappop(indicesheap)
341 idx = heapq.heappop(indicesheap)
603
342
604 chunk = _trimchunk(revlog, revs, previdx, idx)
343 chunk = _trimchunk(revlog, revs, previdx, idx)
605 if chunk:
344 if chunk:
606 yield chunk
345 yield chunk
607
346
608 previdx = idx
347 previdx = idx
609
348
610 chunk = _trimchunk(revlog, revs, previdx)
349 chunk = _trimchunk(revlog, revs, previdx)
611 if chunk:
350 if chunk:
612 yield chunk
351 yield chunk
613
352
353 def _trimchunk(revlog, revs, startidx, endidx=None):
354 """returns revs[startidx:endidx] without empty trailing revs
355
356 Doctest Setup
357 >>> revlog = _testrevlog([
358 ... 5, #0
359 ... 10, #1
360 ... 12, #2
361 ... 12, #3 (empty)
362 ... 17, #4
363 ... 21, #5
364 ... 21, #6 (empty)
365 ... ])
366
367 Contiguous cases:
368 >>> _trimchunk(revlog, [0, 1, 2, 3, 4, 5, 6], 0)
369 [0, 1, 2, 3, 4, 5]
370 >>> _trimchunk(revlog, [0, 1, 2, 3, 4, 5, 6], 0, 5)
371 [0, 1, 2, 3, 4]
372 >>> _trimchunk(revlog, [0, 1, 2, 3, 4, 5, 6], 0, 4)
373 [0, 1, 2]
374 >>> _trimchunk(revlog, [0, 1, 2, 3, 4, 5, 6], 2, 4)
375 [2]
376 >>> _trimchunk(revlog, [0, 1, 2, 3, 4, 5, 6], 3)
377 [3, 4, 5]
378 >>> _trimchunk(revlog, [0, 1, 2, 3, 4, 5, 6], 3, 5)
379 [3, 4]
380
381 Discontiguous cases:
382 >>> _trimchunk(revlog, [1, 3, 5, 6], 0)
383 [1, 3, 5]
384 >>> _trimchunk(revlog, [1, 3, 5, 6], 0, 2)
385 [1]
386 >>> _trimchunk(revlog, [1, 3, 5, 6], 1, 3)
387 [3, 5]
388 >>> _trimchunk(revlog, [1, 3, 5, 6], 1)
389 [3, 5]
390 """
391 length = revlog.length
392
393 if endidx is None:
394 endidx = len(revs)
395
396 # If we have a non-empty delta candidate, there is nothing to trim
397 if revs[endidx - 1] < len(revlog):
398 # Trim empty revs at the end, except the very first revision of a chain
399 while (endidx > 1
400 and endidx > startidx
401 and length(revs[endidx - 1]) == 0):
402 endidx -= 1
403
404 return revs[startidx:endidx]
405
406 def segmentspan(revlog, revs, deltainfo=None):
407 """Get the byte span of a segment of revisions
408
409 revs is a sorted array of revision numbers
410
411 >>> revlog = _testrevlog([
412 ... 5, #0
413 ... 10, #1
414 ... 12, #2
415 ... 12, #3 (empty)
416 ... 17, #4
417 ... ])
418
419 >>> segmentspan(revlog, [0, 1, 2, 3, 4])
420 17
421 >>> segmentspan(revlog, [0, 4])
422 17
423 >>> segmentspan(revlog, [3, 4])
424 5
425 >>> segmentspan(revlog, [1, 2, 3,])
426 7
427 >>> segmentspan(revlog, [1, 3])
428 7
429 """
430 if not revs:
431 return 0
432 if deltainfo is not None and len(revlog) <= revs[-1]:
433 if len(revs) == 1:
434 return deltainfo.deltalen
435 offset = revlog.end(len(revlog) - 1)
436 end = deltainfo.deltalen + offset
437 else:
438 end = revlog.end(revs[-1])
439 return end - revlog.start(revs[0])
440
614 @attr.s(slots=True, frozen=True)
441 @attr.s(slots=True, frozen=True)
615 class _deltainfo(object):
442 class _deltainfo(object):
616 distance = attr.ib()
443 distance = attr.ib()
617 deltalen = attr.ib()
444 deltalen = attr.ib()
618 data = attr.ib()
445 data = attr.ib()
619 base = attr.ib()
446 base = attr.ib()
620 chainbase = attr.ib()
447 chainbase = attr.ib()
621 chainlen = attr.ib()
448 chainlen = attr.ib()
622 compresseddeltalen = attr.ib()
449 compresseddeltalen = attr.ib()
623 snapshotdepth = attr.ib()
450 snapshotdepth = attr.ib()
624
451
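(For reference, as these fields are computed by _builddeltainfo below: ``distance`` is the byte span read back to the start of the chain base, ``deltalen`` is the compressed size of this delta, ``compresseddeltalen`` is the cumulated compressed size of the whole chain, and ``snapshotdepth`` is non-None only when the delta would form a snapshot, full or intermediate.)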
625 class _deltacomputer(object):
452 def isgooddeltainfo(revlog, deltainfo, revinfo):
453 """Returns True if the given delta is good. Good means that it is within
454 the disk span, disk size, and chain length bounds that we know to be
455 performant."""
456 if deltainfo is None:
457 return False
458
459 # - 'deltainfo.distance' is the distance from the base revision --
460 # bounding it limits the amount of I/O we need to do.
461 # - 'deltainfo.compresseddeltalen' is the sum of the total size of
462 # deltas we need to apply -- bounding it limits the amount of CPU
463 # we consume.
464
465 if revlog._sparserevlog:
466 # As sparse-read will be used, we can consider that the distance,
467 # instead of being the span of the whole chunk,
468 # is the span of the largest read chunk
469 base = deltainfo.base
470
471 if base != nullrev:
472 deltachain = revlog._deltachain(base)[0]
473 else:
474 deltachain = []
475
476 # search for the first non-snapshot revision
477 for idx, r in enumerate(deltachain):
478 if not revlog.issnapshot(r):
479 break
480 deltachain = deltachain[idx:]
481 chunks = slicechunk(revlog, deltachain, deltainfo)
482 all_span = [segmentspan(revlog, revs, deltainfo)
483 for revs in chunks]
484 distance = max(all_span)
485 else:
486 distance = deltainfo.distance
487
488 textlen = revinfo.textlen
489 defaultmax = textlen * 4
490 maxdist = revlog._maxdeltachainspan
491 if not maxdist:
492 maxdist = distance # ensure the conditional pass
493 maxdist = max(maxdist, defaultmax)
494 if revlog._sparserevlog and maxdist < revlog._srmingapsize:
495 # In multiple places, we ignore irrelevant data ranges below a
496 # certain size. We also apply this tradeoff here and relax the span
497 # constraint for small enough content.
498 maxdist = revlog._srmingapsize
499
500 # Bad delta from read span:
501 #
502 # If the span of data read is larger than the maximum allowed.
503 if maxdist < distance:
504 return False
505
506 # Bad delta from new delta size:
507 #
508 # If the delta size is larger than the target text, storing the
509 # delta will be inefficient.
510 if textlen < deltainfo.deltalen:
511 return False
512
513 # Bad delta from cumulated payload size:
514 #
515 # If the sum of the deltas gets larger than K * the target text length.
516 if textlen * LIMIT_DELTA2TEXT < deltainfo.compresseddeltalen:
517 return False
518
519 # Bad delta from chain length:
520 #
521 # If the number of deltas in the chain gets too high.
522 if (revlog._maxchainlen
523 and revlog._maxchainlen < deltainfo.chainlen):
524 return False
525
526 # bad delta from intermediate snapshot size limit
527 #
528 # If an intermediate snapshot size is higher than the limit. The
529 # limit exist to prevent endless chain of intermediate delta to be
530 # created.
531 if (deltainfo.snapshotdepth is not None and
532 (textlen >> deltainfo.snapshotdepth) < deltainfo.deltalen):
533 return False
534
535 # bad delta if new intermediate snapshot is larger than the previous
536 # snapshot
537 if (deltainfo.snapshotdepth
538 and revlog.length(deltainfo.base) < deltainfo.deltalen):
539 return False
540
541 return True
542
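Putting numbers on the checks above (using LIMIT_DELTA2TEXT = 2 as defined earlier): for a 1000-byte revision, a candidate delta is rejected if the data to read spans more than max(4 * 1000, _maxdeltachainspan) bytes (when a chain-span limit is configured), if the delta itself is larger than 1000 bytes, or if the chain's cumulated compressed deltas exceed 2 * 1000 bytes.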
543 class deltacomputer(object):
626 def __init__(self, revlog):
544 def __init__(self, revlog):
627 self.revlog = revlog
545 self.revlog = revlog
628
546
629 def _getcandidaterevs(self, p1, p2, cachedelta):
547 def _getcandidaterevs(self, p1, p2, cachedelta):
630 """
548 """
631 Provides revisions that are interesting to diff against,
549 Provides revisions that are interesting to diff against,
632 grouped by level of easiness.
550 grouped by level of easiness.
633 """
551 """
634 revlog = self.revlog
552 revlog = self.revlog
635 gdelta = revlog._generaldelta
553 gdelta = revlog._generaldelta
636 curr = len(revlog)
554 curr = len(revlog)
637 prev = curr - 1
555 prev = curr - 1
638 p1r, p2r = revlog.rev(p1), revlog.rev(p2)
556 p1r, p2r = revlog.rev(p1), revlog.rev(p2)
639
557
640 # should we try to build a delta?
558 # should we try to build a delta?
641 if prev != nullrev and revlog._storedeltachains:
559 if prev != nullrev and revlog._storedeltachains:
642 tested = set()
560 tested = set()
643 # This condition is true most of the time when processing
561 # This condition is true most of the time when processing
644 # changegroup data into a generaldelta repo. The only time it
562 # changegroup data into a generaldelta repo. The only time it
645 # isn't true is if this is the first revision in a delta chain
563 # isn't true is if this is the first revision in a delta chain
646 # or if ``format.generaldelta=true`` disabled ``lazydeltabase``.
564 # or if ``format.generaldelta=true`` disabled ``lazydeltabase``.
647 if cachedelta and gdelta and revlog._lazydeltabase:
565 if cachedelta and gdelta and revlog._lazydeltabase:
648 # Assume what we received from the server is a good choice
566 # Assume what we received from the server is a good choice
649 # build delta will reuse the cache
567 # build delta will reuse the cache
650 yield (cachedelta[0],)
568 yield (cachedelta[0],)
651 tested.add(cachedelta[0])
569 tested.add(cachedelta[0])
652
570
653 if gdelta:
571 if gdelta:
654 # exclude already lazy tested base if any
572 # exclude already lazy tested base if any
655 parents = [p for p in (p1r, p2r)
573 parents = [p for p in (p1r, p2r)
656 if p != nullrev and p not in tested]
574 if p != nullrev and p not in tested]
657
575
658 if not revlog._deltabothparents and len(parents) == 2:
576 if not revlog._deltabothparents and len(parents) == 2:
659 parents.sort()
577 parents.sort()
660 # To minimize the chance of having to build a fulltext,
578 # To minimize the chance of having to build a fulltext,
661 # pick first whichever parent is closest to us (max rev)
579 # pick first whichever parent is closest to us (max rev)
662 yield (parents[1],)
580 yield (parents[1],)
663 # then the other one (min rev) if the first did not fit
581 # then the other one (min rev) if the first did not fit
664 yield (parents[0],)
582 yield (parents[0],)
665 tested.update(parents)
583 tested.update(parents)
666 elif len(parents) > 0:
584 elif len(parents) > 0:
667 # Test all parents (1 or 2), and keep the best candidate
585 # Test all parents (1 or 2), and keep the best candidate
668 yield parents
586 yield parents
669 tested.update(parents)
587 tested.update(parents)
670
588
671 if prev not in tested:
589 if prev not in tested:
672 # other approaches failed; try against prev to hopefully save us a
590 # other approaches failed; try against prev to hopefully save us a
673 # fulltext.
591 # fulltext.
674 yield (prev,)
592 yield (prev,)
675 tested.add(prev)
593 tested.add(prev)
676
594
677 def buildtext(self, revinfo, fh):
595 def buildtext(self, revinfo, fh):
678 """Builds a fulltext version of a revision
596 """Builds a fulltext version of a revision
679
597
680 revinfo: _revisioninfo instance that contains all needed info
598 revinfo: _revisioninfo instance that contains all needed info
681 fh: file handle to either the .i or the .d revlog file,
599 fh: file handle to either the .i or the .d revlog file,
682 depending on whether it is inlined or not
600 depending on whether it is inlined or not
683 """
601 """
684 btext = revinfo.btext
602 btext = revinfo.btext
685 if btext[0] is not None:
603 if btext[0] is not None:
686 return btext[0]
604 return btext[0]
687
605
688 revlog = self.revlog
606 revlog = self.revlog
689 cachedelta = revinfo.cachedelta
607 cachedelta = revinfo.cachedelta
690 flags = revinfo.flags
608 flags = revinfo.flags
691 node = revinfo.node
609 node = revinfo.node
692
610
693 baserev = cachedelta[0]
611 baserev = cachedelta[0]
694 delta = cachedelta[1]
612 delta = cachedelta[1]
695 # special case deltas which replace entire base; no need to decode
613 # special case deltas which replace entire base; no need to decode
696 # base revision. this neatly avoids censored bases, which throw when
614 # base revision. this neatly avoids censored bases, which throw when
697 # they're decoded.
615 # they're decoded.
698 hlen = struct.calcsize(">lll")
616 hlen = struct.calcsize(">lll")
699 if delta[:hlen] == mdiff.replacediffheader(revlog.rawsize(baserev),
617 if delta[:hlen] == mdiff.replacediffheader(revlog.rawsize(baserev),
700 len(delta) - hlen):
618 len(delta) - hlen):
701 btext[0] = delta[hlen:]
619 btext[0] = delta[hlen:]
702 else:
620 else:
703 # deltabase is rawtext before changed by flag processors, which is
621 # deltabase is rawtext before changed by flag processors, which is
704 # equivalent to non-raw text
622 # equivalent to non-raw text
705 basetext = revlog.revision(baserev, _df=fh, raw=False)
623 basetext = revlog.revision(baserev, _df=fh, raw=False)
706 btext[0] = mdiff.patch(basetext, delta)
624 btext[0] = mdiff.patch(basetext, delta)
707
625
708 try:
626 try:
709 res = revlog._processflags(btext[0], flags, 'read', raw=True)
627 res = revlog._processflags(btext[0], flags, 'read', raw=True)
710 btext[0], validatehash = res
628 btext[0], validatehash = res
711 if validatehash:
629 if validatehash:
712 revlog.checkhash(btext[0], node, p1=revinfo.p1, p2=revinfo.p2)
630 revlog.checkhash(btext[0], node, p1=revinfo.p1, p2=revinfo.p2)
713 if flags & REVIDX_ISCENSORED:
631 if flags & REVIDX_ISCENSORED:
714 raise RevlogError(_('node %s is not censored') % node)
632 raise RevlogError(_('node %s is not censored') % node)
715 except CensoredNodeError:
633 except CensoredNodeError:
716 # must pass the censored index flag to add censored revisions
634 # must pass the censored index flag to add censored revisions
717 if not flags & REVIDX_ISCENSORED:
635 if not flags & REVIDX_ISCENSORED:
718 raise
636 raise
719 return btext[0]
637 return btext[0]
720
638
721 def _builddeltadiff(self, base, revinfo, fh):
639 def _builddeltadiff(self, base, revinfo, fh):
722 revlog = self.revlog
640 revlog = self.revlog
723 t = self.buildtext(revinfo, fh)
641 t = self.buildtext(revinfo, fh)
724 if revlog.iscensored(base):
642 if revlog.iscensored(base):
725 # deltas based on a censored revision must replace the
643 # deltas based on a censored revision must replace the
726 # full content in one patch, so delta works everywhere
644 # full content in one patch, so delta works everywhere
727 header = mdiff.replacediffheader(revlog.rawsize(base), len(t))
645 header = mdiff.replacediffheader(revlog.rawsize(base), len(t))
728 delta = header + t
646 delta = header + t
729 else:
647 else:
730 ptext = revlog.revision(base, _df=fh, raw=True)
648 ptext = revlog.revision(base, _df=fh, raw=True)
731 delta = mdiff.textdiff(ptext, t)
649 delta = mdiff.textdiff(ptext, t)
732
650
733 return delta
651 return delta
734
652
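The delta format relied on here is mdiff's binary diff; the essential contract (a quick sketch, assuming a Mercurial checkout is importable) is that patching the base with the delta reproduces the target:

    from mercurial import mdiff
    base, target = b'a\nb\nc\n', b'a\nB\nc\n'
    delta = mdiff.textdiff(base, target)
    assert mdiff.patch(base, delta) == target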
735 def _builddeltainfo(self, revinfo, base, fh):
653 def _builddeltainfo(self, revinfo, base, fh):
736 # can we use the cached delta?
654 # can we use the cached delta?
737 if revinfo.cachedelta and revinfo.cachedelta[0] == base:
655 if revinfo.cachedelta and revinfo.cachedelta[0] == base:
738 delta = revinfo.cachedelta[1]
656 delta = revinfo.cachedelta[1]
739 else:
657 else:
740 delta = self._builddeltadiff(base, revinfo, fh)
658 delta = self._builddeltadiff(base, revinfo, fh)
741 revlog = self.revlog
659 revlog = self.revlog
742 header, data = revlog.compress(delta)
660 header, data = revlog.compress(delta)
743 deltalen = len(header) + len(data)
661 deltalen = len(header) + len(data)
744 chainbase = revlog.chainbase(base)
662 chainbase = revlog.chainbase(base)
745 offset = revlog.end(len(revlog) - 1)
663 offset = revlog.end(len(revlog) - 1)
746 dist = deltalen + offset - revlog.start(chainbase)
664 dist = deltalen + offset - revlog.start(chainbase)
747 if revlog._generaldelta:
665 if revlog._generaldelta:
748 deltabase = base
666 deltabase = base
749 else:
667 else:
750 deltabase = chainbase
668 deltabase = chainbase
751 chainlen, compresseddeltalen = revlog._chaininfo(base)
669 chainlen, compresseddeltalen = revlog._chaininfo(base)
752 chainlen += 1
670 chainlen += 1
753 compresseddeltalen += deltalen
671 compresseddeltalen += deltalen
754
672
755 revlog = self.revlog
673 revlog = self.revlog
756 snapshotdepth = None
674 snapshotdepth = None
757 if deltabase == nullrev:
675 if deltabase == nullrev:
758 snapshotdepth = 0
676 snapshotdepth = 0
759 elif revlog._sparserevlog and revlog.issnapshot(deltabase):
677 elif revlog._sparserevlog and revlog.issnapshot(deltabase):
760 # A delta chain should always be one full snapshot,
678 # A delta chain should always be one full snapshot,
761 # zero or more semi-snapshots, and zero or more deltas
679 # zero or more semi-snapshots, and zero or more deltas
762 p1, p2 = revlog.rev(revinfo.p1), revlog.rev(revinfo.p2)
680 p1, p2 = revlog.rev(revinfo.p1), revlog.rev(revinfo.p2)
763 if deltabase not in (p1, p2) and revlog.issnapshot(deltabase):
681 if deltabase not in (p1, p2) and revlog.issnapshot(deltabase):
764 snapshotdepth = len(revlog._deltachain(deltabase)[0])
682 snapshotdepth = len(revlog._deltachain(deltabase)[0])
765
683
766 return _deltainfo(dist, deltalen, (header, data), deltabase,
684 return _deltainfo(dist, deltalen, (header, data), deltabase,
767 chainbase, chainlen, compresseddeltalen,
685 chainbase, chainlen, compresseddeltalen,
768 snapshotdepth)
686 snapshotdepth)
769
687
770 def finddeltainfo(self, revinfo, fh):
688 def finddeltainfo(self, revinfo, fh):
771 """Find an acceptable delta against a candidate revision
689 """Find an acceptable delta against a candidate revision
772
690
773 revinfo: information about the revision (instance of _revisioninfo)
691 revinfo: information about the revision (instance of _revisioninfo)
774 fh: file handle to either the .i or the .d revlog file,
692 fh: file handle to either the .i or the .d revlog file,
775 depending on whether it is inlined or not
693 depending on whether it is inlined or not
776
694
777 Returns the first acceptable candidate revision, as ordered by
695 Returns the first acceptable candidate revision, as ordered by
778 _getcandidaterevs
696 _getcandidaterevs
779 """
697 """
780 if not revinfo.textlen:
698 if not revinfo.textlen:
781 return None # empty files do not need a delta
699 return None # empty files do not need a delta
782
700
783 cachedelta = revinfo.cachedelta
701 cachedelta = revinfo.cachedelta
784 p1 = revinfo.p1
702 p1 = revinfo.p1
785 p2 = revinfo.p2
703 p2 = revinfo.p2
786 revlog = self.revlog
704 revlog = self.revlog
787
705
788 deltalength = self.revlog.length
706 deltalength = self.revlog.length
789 deltaparent = self.revlog.deltaparent
707 deltaparent = self.revlog.deltaparent
790
708
791 deltainfo = None
709 deltainfo = None
792 deltas_limit = revinfo.textlen * LIMIT_DELTA2TEXT
710 deltas_limit = revinfo.textlen * LIMIT_DELTA2TEXT
793 for candidaterevs in self._getcandidaterevs(p1, p2, cachedelta):
711 for candidaterevs in self._getcandidaterevs(p1, p2, cachedelta):
794 # filter out delta base that will never produce good delta
712 # filter out delta base that will never produce good delta
795 candidaterevs = [r for r in candidaterevs
713 candidaterevs = [r for r in candidaterevs
796 if self.revlog.length(r) <= deltas_limit]
714 if self.revlog.length(r) <= deltas_limit]
797 nominateddeltas = []
715 nominateddeltas = []
798 for candidaterev in candidaterevs:
716 for candidaterev in candidaterevs:
799 # skip over empty delta (no need to include them in a chain)
717 # skip over empty delta (no need to include them in a chain)
800 while candidaterev != nullrev and not deltalength(candidaterev):
718 while candidaterev != nullrev and not deltalength(candidaterev):
801 candidaterev = deltaparent(candidaterev)
719 candidaterev = deltaparent(candidaterev)
802 # no need to try a delta against nullid, this will be handled
720 # no need to try a delta against nullid, this will be handled
803 # by fulltext later.
721 # by fulltext later.
804 if candidaterev == nullrev:
722 if candidaterev == nullrev:
805 continue
723 continue
806 # no delta for rawtext-changing revs (see "candelta" for why)
724 # no delta for rawtext-changing revs (see "candelta" for why)
807 if revlog.flags(candidaterev) & REVIDX_RAWTEXT_CHANGING_FLAGS:
725 if revlog.flags(candidaterev) & REVIDX_RAWTEXT_CHANGING_FLAGS:
808 continue
726 continue
809 candidatedelta = self._builddeltainfo(revinfo, candidaterev, fh)
727 candidatedelta = self._builddeltainfo(revinfo, candidaterev, fh)
810 if revlog._isgooddeltainfo(candidatedelta, revinfo):
728 if isgooddeltainfo(self.revlog, candidatedelta, revinfo):
811 nominateddeltas.append(candidatedelta)
729 nominateddeltas.append(candidatedelta)
812 if nominateddeltas:
730 if nominateddeltas:
813 deltainfo = min(nominateddeltas, key=lambda x: x.deltalen)
731 deltainfo = min(nominateddeltas, key=lambda x: x.deltalen)
814 break
732 break
815
733
816 return deltainfo
734 return deltainfo
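
The selection loop above reads as: for each group of candidate bases, build a delta against every surviving candidate, keep the acceptable ones, and return the smallest from the first group that yields any. A minimal standalone sketch of that shape (the names here are made up for illustration and are not part of revlog.py):

def findsmallestdelta(candidategroups, builddelta, isgood):
    # candidategroups: iterable of iterables of candidate base revisions
    # builddelta(rev) -> object with a 'deltalen' attribute, or None
    # isgood(delta) -> whether the delta is within the configured bounds
    for group in candidategroups:
        nominated = [d for d in (builddelta(r) for r in group)
                     if d is not None and isgood(d)]
        if nominated:
            # the first group with an acceptable delta wins; pick the smallest
            return min(nominated, key=lambda d: d.deltalen)
    return None

class _fakedelta(object):
    def __init__(self, deltalen):
        self.deltalen = deltalen

best = findsmallestdelta([[3, 1, 2]], lambda r: _fakedelta(r * 10),
                         lambda d: d.deltalen > 0)
assert best.deltalen == 10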
817
818 @attr.s(slots=True, frozen=True)
819 class _revisioninfo(object):
820 """Information about a revision that allows building its fulltext
821 node: expected hash of the revision
822 p1, p2: parent revs of the revision
823 btext: built text cache consisting of a one-element list
824 cachedelta: (baserev, uncompressed_delta) or None
825 flags: flags associated with the revision storage
826
827 One of btext[0] or cachedelta must be set.
828 """
829 node = attr.ib()
830 p1 = attr.ib()
831 p2 = attr.ib()
832 btext = attr.ib()
833 textlen = attr.ib()
834 cachedelta = attr.ib()
835 flags = attr.ib()
836
837 @interfaceutil.implementer(repository.irevisiondelta)
838 @attr.s(slots=True, frozen=True)
839 class revlogrevisiondelta(object):
840 node = attr.ib()
841 p1node = attr.ib()
842 p2node = attr.ib()
843 basenode = attr.ib()
844 linknode = attr.ib()
845 flags = attr.ib()
846 baserevisionsize = attr.ib()
847 revision = attr.ib()
848 delta = attr.ib()
849
850 # index v0:
851 # 4 bytes: offset
852 # 4 bytes: compressed length
853 # 4 bytes: base rev
854 # 4 bytes: link rev
855 # 20 bytes: parent 1 nodeid
856 # 20 bytes: parent 2 nodeid
857 # 20 bytes: nodeid
858 indexformatv0 = struct.Struct(">4l20s20s20s")
859 indexformatv0_pack = indexformatv0.pack
860 indexformatv0_unpack = indexformatv0.unpack
861
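
For concreteness, a quick standalone round-trip through the v0 record layout described above (pure struct usage; the entry values are made up):

import struct

indexformatv0 = struct.Struct(">4l20s20s20s")
entry = (0, 120, -1, 0, b'\x11' * 20, b'\x00' * 20, b'\xaa' * 20)
packed = indexformatv0.pack(*entry)
assert len(packed) == indexformatv0.size == 76   # 4*4 + 3*20 bytes
assert indexformatv0.unpack(packed) == entry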
862 class revlogoldindex(list):
863 def __getitem__(self, i):
864 if i == -1:
865 return (0, 0, 0, -1, -1, -1, -1, nullid)
866 return list.__getitem__(self, i)
867
868 class revlogoldio(object):
869 def __init__(self):
870 self.size = indexformatv0.size
871
872 def parseindex(self, data, inline):
873 s = self.size
874 index = []
875 nodemap = {nullid: nullrev}
876 n = off = 0
877 l = len(data)
878 while off + s <= l:
879 cur = data[off:off + s]
880 off += s
881 e = indexformatv0_unpack(cur)
882 # transform to revlogv1 format
883 e2 = (offset_type(e[0], 0), e[1], -1, e[2], e[3],
884 nodemap.get(e[4], nullrev), nodemap.get(e[5], nullrev), e[6])
885 index.append(e2)
886 nodemap[e[6]] = n
887 n += 1
888
889 return revlogoldindex(index), nodemap, None
890
891 def packentry(self, entry, node, version, rev):
892 if gettype(entry[0]):
893 raise RevlogError(_('index entry flags need revlog version 1'))
894 e2 = (getoffset(entry[0]), entry[1], entry[3], entry[4],
895 node(entry[5]), node(entry[6]), entry[7])
896 return indexformatv0_pack(*e2)
897
898 # index ng:
899 # 6 bytes: offset
900 # 2 bytes: flags
901 # 4 bytes: compressed length
902 # 4 bytes: uncompressed length
903 # 4 bytes: base rev
904 # 4 bytes: link rev
905 # 4 bytes: parent 1 rev
906 # 4 bytes: parent 2 rev
907 # 32 bytes: nodeid
908 indexformatng = struct.Struct(">Qiiiiii20s12x")
909 indexformatng_pack = indexformatng.pack
910 versionformat = struct.Struct(">I")
911 versionformat_pack = versionformat.pack
912 versionformat_unpack = versionformat.unpack
913
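
Similarly, a standalone sketch of a v1 ("ng") record, including the version-header trick that revlogio.packentry() below applies to rev 0; the flag values are assumed here (REVLOGV1 = 1, FLAG_INLINE_DATA = 1 << 16), not taken from this file:

import struct

indexformatng = struct.Struct(">Qiiiiii20s12x")
versionformat = struct.Struct(">I")
# the first field packs the data offset and the 16-bit flags together
offset, flags = 0, 0
entry = ((offset << 16) | flags, 11, 11, 0, 0, -1, -1, b'\xab' * 20)
p = indexformatng.pack(*entry)
assert len(p) == indexformatng.size == 64
# for rev 0 the unused offset bytes carry the revlog version header:
p = versionformat.pack(1 | (1 << 16)) + p[4:]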
914 # corresponds to uncompressed length of indexformatng (2 gigs, 4-byte
915 # signed integer)
916 _maxentrysize = 0x7fffffff
917
918 class revlogio(object):
919 def __init__(self):
920 self.size = indexformatng.size
921
922 def parseindex(self, data, inline):
923 # call the C implementation to parse the index data
924 index, cache = parsers.parse_index2(data, inline)
925 return index, getattr(index, 'nodemap', None), cache
926
927 def packentry(self, entry, node, version, rev):
928 p = indexformatng_pack(*entry)
929 if rev == 0:
930 p = versionformat_pack(version) + p[4:]
931 return p
932
933 class revlog(object):
934 """
935 the underlying revision storage object
936
937 A revlog consists of two parts, an index and the revision data.
938
939 The index is a file with a fixed record size containing
940 information on each revision, including its nodeid (hash), the
941 nodeids of its parents, the position and offset of its data within
942 the data file, and the revision it's based on. Finally, each entry
943 contains a linkrev entry that can serve as a pointer to external
944 data.
945
946 The revision data itself is a linear collection of data chunks.
947 Each chunk represents a revision and is usually represented as a
948 delta against the previous chunk. To bound lookup time, runs of
949 deltas are limited to about 2 times the length of the original
950 version data. This makes retrieval of a version proportional to
951 its size, or O(1) relative to the number of revisions.
952
953 Both pieces of the revlog are written to in an append-only
954 fashion, which means we never need to rewrite a file to insert or
955 remove data, and can use some simple techniques to avoid the need
956 for locking while reading.
957
958 If checkambig, indexfile is opened with checkambig=True at
959 writing, to avoid file stat ambiguity.
960
961 If mmaplargeindex is True, and an mmapindexthreshold is set, the
962 index will be mmapped rather than read if it is larger than the
963 configured threshold.
964
965 If censorable is True, the revlog can have censored revisions.
966 """
967 def __init__(self, opener, indexfile, datafile=None, checkambig=False,
968 mmaplargeindex=False, censorable=False):
969 """
970 create a revlog object
971
972 opener is a function that abstracts the file opening operation
973 and can be used to implement COW semantics or the like.
974 """
975 self.indexfile = indexfile
976 self.datafile = datafile or (indexfile[:-2] + ".d")
977 self.opener = opener
978 # When True, indexfile is opened with checkambig=True at writing, to
979 # avoid file stat ambiguity.
980 self._checkambig = checkambig
981 self._censorable = censorable
982 # 3-tuple of (node, rev, text) for a raw revision.
983 self._cache = None
984 # Maps rev to chain base rev.
985 self._chainbasecache = util.lrucachedict(100)
986 # 2-tuple of (offset, data) of raw data from the revlog at an offset.
987 self._chunkcache = (0, '')
988 # How much data to read and cache into the raw revlog data cache.
989 self._chunkcachesize = 65536
990 self._maxchainlen = None
991 self._deltabothparents = True
992 self.index = []
993 # Mapping of partial identifiers to full nodes.
994 self._pcache = {}
995 # Mapping of revision integer to full node.
996 self._nodecache = {nullid: nullrev}
997 self._nodepos = None
998 self._compengine = 'zlib'
999 self._maxdeltachainspan = -1
1000 self._withsparseread = False
1001 self._sparserevlog = False
1002 self._srdensitythreshold = 0.50
1003 self._srmingapsize = 262144
1004
1005 mmapindexthreshold = None
1006 v = REVLOG_DEFAULT_VERSION
1007 opts = getattr(opener, 'options', None)
1008 if opts is not None:
1009 if 'revlogv2' in opts:
1010 # version 2 revlogs always use generaldelta.
1011 v = REVLOGV2 | FLAG_GENERALDELTA | FLAG_INLINE_DATA
1012 elif 'revlogv1' in opts:
1013 if 'generaldelta' in opts:
1014 v |= FLAG_GENERALDELTA
1015 else:
1016 v = 0
1017 if 'chunkcachesize' in opts:
1018 self._chunkcachesize = opts['chunkcachesize']
1019 if 'maxchainlen' in opts:
1020 self._maxchainlen = opts['maxchainlen']
1021 if 'deltabothparents' in opts:
1022 self._deltabothparents = opts['deltabothparents']
1023 self._lazydeltabase = bool(opts.get('lazydeltabase', False))
1024 if 'compengine' in opts:
1025 self._compengine = opts['compengine']
1026 if 'maxdeltachainspan' in opts:
1027 self._maxdeltachainspan = opts['maxdeltachainspan']
1028 if mmaplargeindex and 'mmapindexthreshold' in opts:
1029 mmapindexthreshold = opts['mmapindexthreshold']
1030 self._sparserevlog = bool(opts.get('sparse-revlog', False))
1031 withsparseread = bool(opts.get('with-sparse-read', False))
1032 # sparse-revlog forces sparse-read
1033 self._withsparseread = self._sparserevlog or withsparseread
1034 if 'sparse-read-density-threshold' in opts:
1035 self._srdensitythreshold = opts['sparse-read-density-threshold']
1036 if 'sparse-read-min-gap-size' in opts:
1037 self._srmingapsize = opts['sparse-read-min-gap-size']
1038
1039 if self._chunkcachesize <= 0:
1040 raise RevlogError(_('revlog chunk cache size %r is not greater '
1041 'than 0') % self._chunkcachesize)
1042 elif self._chunkcachesize & (self._chunkcachesize - 1):
1043 raise RevlogError(_('revlog chunk cache size %r is not a power '
1044 'of 2') % self._chunkcachesize)
1045
1046 indexdata = ''
1047 self._initempty = True
1048 try:
1049 with self._indexfp() as f:
1050 if (mmapindexthreshold is not None and
1051 self.opener.fstat(f).st_size >= mmapindexthreshold):
1052 indexdata = util.buffer(util.mmapread(f))
1053 else:
1054 indexdata = f.read()
1055 if len(indexdata) > 0:
1056 v = versionformat_unpack(indexdata[:4])[0]
1057 self._initempty = False
1058 except IOError as inst:
1059 if inst.errno != errno.ENOENT:
1060 raise
1061
1062 self.version = v
1063 self._inline = v & FLAG_INLINE_DATA
1064 self._generaldelta = v & FLAG_GENERALDELTA
1065 flags = v & ~0xFFFF
1066 fmt = v & 0xFFFF
1067 if fmt == REVLOGV0:
1068 if flags:
1069 raise RevlogError(_('unknown flags (%#04x) in version %d '
1070 'revlog %s') %
1071 (flags >> 16, fmt, self.indexfile))
1072 elif fmt == REVLOGV1:
1073 if flags & ~REVLOGV1_FLAGS:
1074 raise RevlogError(_('unknown flags (%#04x) in version %d '
1075 'revlog %s') %
1076 (flags >> 16, fmt, self.indexfile))
1077 elif fmt == REVLOGV2:
1078 if flags & ~REVLOGV2_FLAGS:
1079 raise RevlogError(_('unknown flags (%#04x) in version %d '
1080 'revlog %s') %
1081 (flags >> 16, fmt, self.indexfile))
1082 else:
1083 raise RevlogError(_('unknown version (%d) in revlog %s') %
1084 (fmt, self.indexfile))
1085
1086 self._storedeltachains = True
1087
1088 self._io = revlogio()
1089 if self.version == REVLOGV0:
1090 self._io = revlogoldio()
1091 try:
1092 d = self._io.parseindex(indexdata, self._inline)
1093 except (ValueError, IndexError):
1094 raise RevlogError(_("index %s is corrupted") % (self.indexfile))
1095 self.index, nodemap, self._chunkcache = d
1096 if nodemap is not None:
1097 self.nodemap = self._nodecache = nodemap
1098 if not self._chunkcache:
1099 self._chunkclear()
1100 # revnum -> (chain-length, sum-delta-length)
1101 self._chaininfocache = {}
1102 # revlog header -> revlog compressor
1103 self._decompressors = {}
1104
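
A usage sketch for the constructor above. The store path is hypothetical and error handling is omitted, so treat this as an illustration rather than a supported entry point:

from mercurial import vfs as vfsmod
from mercurial import revlog as revlogmod

# an opener abstracts file access; a plain store vfs is the common case
opener = vfsmod.vfs(b'/path/to/repo/.hg/store')
cl = revlogmod.revlog(opener, b'00changelog.i')
print(len(cl), cl.tip())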
1105 @util.propertycache
1106 def _compressor(self):
1107 return util.compengines[self._compengine].revlogcompressor()
1108
1109 def _indexfp(self, mode='r'):
1110 """file object for the revlog's index file"""
1111 args = {r'mode': mode}
1112 if mode != 'r':
1113 args[r'checkambig'] = self._checkambig
1114 if mode == 'w':
1115 args[r'atomictemp'] = True
1116 return self.opener(self.indexfile, **args)
1117
1118 def _datafp(self, mode='r'):
1119 """file object for the revlog's data file"""
1120 return self.opener(self.datafile, mode=mode)
1121
1122 @contextlib.contextmanager
1123 def _datareadfp(self, existingfp=None):
1124 """file object suitable to read data"""
1125 if existingfp is not None:
1126 yield existingfp
1127 else:
1128 if self._inline:
1129 func = self._indexfp
1130 else:
1131 func = self._datafp
1132 with func() as fp:
1133 yield fp
1134
1135 def tip(self):
1136 return self.node(len(self.index) - 1)
1137 def __contains__(self, rev):
1138 return 0 <= rev < len(self)
1139 def __len__(self):
1140 return len(self.index)
1141 def __iter__(self):
1142 return iter(pycompat.xrange(len(self)))
1143 def revs(self, start=0, stop=None):
1144 """iterate over all revs in this revlog (from start to stop)"""
1145 step = 1
1146 length = len(self)
1147 if stop is not None:
1148 if start > stop:
1149 step = -1
1150 stop += step
1151 if stop > length:
1152 stop = length
1153 else:
1154 stop = length
1155 return pycompat.xrange(start, stop, step)
1156
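
Note that stop is inclusive in both directions. A standalone re-implementation of the arithmetic above makes the boundary behavior easy to check:

def _revs(length, start=0, stop=None):
    step = 1
    if stop is not None:
        if start > stop:
            step = -1
        stop += step
        if stop > length:
            stop = length
    else:
        stop = length
    return range(start, stop, step)

assert list(_revs(5, 0, 3)) == [0, 1, 2, 3]   # ascending, stop included
assert list(_revs(5, 3, 1)) == [3, 2, 1]      # descending when start > stop
assert list(_revs(3)) == [0, 1, 2]            # defaults: the whole revlog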
1157 @util.propertycache
1158 def nodemap(self):
1159 if self.index:
1160 # populate mapping down to the initial node
1161 node0 = self.index[0][7] # get around changelog filtering
1162 self.rev(node0)
1163 return self._nodecache
1164
1165 def hasnode(self, node):
1166 try:
1167 self.rev(node)
1168 return True
1169 except KeyError:
1170 return False
1171
1172 def candelta(self, baserev, rev):
1173 """whether two revisions (baserev, rev) can be delta-ed or not"""
1174 # Disable delta if either rev requires a content-changing flag
1175 # processor (ex. LFS). This is because such a flag processor can alter
1176 # the rawtext content that the delta will be based on, and two clients
1177 # could have the same revlog node with different flags (i.e. different
1178 # rawtext contents) and the delta could be incompatible.
1179 if ((self.flags(baserev) & REVIDX_RAWTEXT_CHANGING_FLAGS)
1180 or (self.flags(rev) & REVIDX_RAWTEXT_CHANGING_FLAGS)):
1181 return False
1182 return True
1183
1184 def clearcaches(self):
1185 self._cache = None
1186 self._chainbasecache.clear()
1187 self._chunkcache = (0, '')
1188 self._pcache = {}
1189
1190 try:
1191 self._nodecache.clearcaches()
1192 except AttributeError:
1193 self._nodecache = {nullid: nullrev}
1194 self._nodepos = None
1195
1196 def rev(self, node):
1197 try:
1198 return self._nodecache[node]
1199 except TypeError:
1200 raise
1201 except RevlogError:
1202 # parsers.c radix tree lookup failed
1203 if node == wdirid or node in wdirfilenodeids:
1204 raise error.WdirUnsupported
1205 raise LookupError(node, self.indexfile, _('no node'))
1206 except KeyError:
1207 # pure python cache lookup failed
1208 n = self._nodecache
1209 i = self.index
1210 p = self._nodepos
1211 if p is None:
1212 p = len(i) - 1
1213 else:
1214 assert p < len(i)
1215 for r in pycompat.xrange(p, -1, -1):
1216 v = i[r][7]
1217 n[v] = r
1218 if v == node:
1219 self._nodepos = r - 1
1220 return r
1221 if node == wdirid or node in wdirfilenodeids:
1222 raise error.WdirUnsupported
1223 raise LookupError(node, self.indexfile, _('no node'))
1224
1225 # Accessors for index entries.
1226
1227 # First tuple entry is 8 bytes. First 6 bytes are offset. Last 2 bytes
1228 # are flags.
1229 def start(self, rev):
1230 return int(self.index[rev][0] >> 16)
1231
1232 def flags(self, rev):
1233 return self.index[rev][0] & 0xFFFF
1234
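
The bit-packing in the first index field is worth spelling out; both accessors above reduce to a shift and a mask:

offset_flags = (123456 << 16) | 0x0001      # hypothetical entry[0] value
assert offset_flags >> 16 == 123456         # what start() extracts
assert offset_flags & 0xFFFF == 0x0001      # what flags() extracts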
1235 def length(self, rev):
1236 return self.index[rev][1]
1237
1238 def rawsize(self, rev):
1239 """return the length of the uncompressed text for a given revision"""
1240 l = self.index[rev][2]
1241 if l >= 0:
1242 return l
1243
1244 t = self.revision(rev, raw=True)
1245 return len(t)
1246
1247 def size(self, rev):
1248 """length of non-raw text (processed by a "read" flag processor)"""
1249 # fast path: if no "read" flag processor could change the content,
1250 # size is rawsize. note: ELLIPSIS is known to not change the content.
1251 flags = self.flags(rev)
1252 if flags & (REVIDX_KNOWN_FLAGS ^ REVIDX_ELLIPSIS) == 0:
1253 return self.rawsize(rev)
1254
1255 return len(self.revision(rev, raw=False))
1256
1257 def chainbase(self, rev):
1258 base = self._chainbasecache.get(rev)
1259 if base is not None:
1260 return base
1261
1262 index = self.index
1263 iterrev = rev
1264 base = index[iterrev][3]
1265 while base != iterrev:
1266 iterrev = base
1267 base = index[iterrev][3]
1268
1269 self._chainbasecache[rev] = base
1270 return base
1271
1272 def linkrev(self, rev):
1273 return self.index[rev][4]
1274
1275 def parentrevs(self, rev):
1276 try:
1277 entry = self.index[rev]
1278 except IndexError:
1279 if rev == wdirrev:
1280 raise error.WdirUnsupported
1281 raise
1282
1283 return entry[5], entry[6]
1284
1285 def node(self, rev):
1286 try:
1287 return self.index[rev][7]
1288 except IndexError:
1289 if rev == wdirrev:
1290 raise error.WdirUnsupported
1291 raise
1292
1293 # Derived from index values.
1294
1295 def end(self, rev):
1296 return self.start(rev) + self.length(rev)
1297
1298 def parents(self, node):
1299 i = self.index
1300 d = i[self.rev(node)]
1301 return i[d[5]][7], i[d[6]][7] # map revisions to nodes inline
1302
1303 def chainlen(self, rev):
1304 return self._chaininfo(rev)[0]
1305
1306 def _chaininfo(self, rev):
1307 chaininfocache = self._chaininfocache
1308 if rev in chaininfocache:
1309 return chaininfocache[rev]
1310 index = self.index
1311 generaldelta = self._generaldelta
1312 iterrev = rev
1313 e = index[iterrev]
1314 clen = 0
1315 compresseddeltalen = 0
1316 while iterrev != e[3]:
1317 clen += 1
1318 compresseddeltalen += e[1]
1319 if generaldelta:
1320 iterrev = e[3]
1321 else:
1322 iterrev -= 1
1323 if iterrev in chaininfocache:
1324 t = chaininfocache[iterrev]
1325 clen += t[0]
1326 compresseddeltalen += t[1]
1327 break
1328 e = index[iterrev]
1329 else:
1330 # Add text length of base since decompressing that also takes
1331 # work. For cache hits the length is already included.
1332 compresseddeltalen += e[1]
1333 r = (clen, compresseddeltalen)
1334 chaininfocache[rev] = r
1335 return r
1336
1337 def _deltachain(self, rev, stoprev=None):
1338 """Obtain the delta chain for a revision.
1339
1340 ``stoprev`` specifies a revision to stop at. If not specified, we
1341 stop at the base of the chain.
1342
1343 Returns a 2-tuple of (chain, stopped) where ``chain`` is a list of
1344 revs in ascending order and ``stopped`` is a bool indicating whether
1345 ``stoprev`` was hit.
1346 """
1347 # Try C implementation.
1348 try:
1349 return self.index.deltachain(rev, stoprev, self._generaldelta)
1350 except AttributeError:
1351 pass
1352
1353 chain = []
1354
1355 # Alias to prevent attribute lookup in tight loop.
1356 index = self.index
1357 generaldelta = self._generaldelta
1358
1359 iterrev = rev
1360 e = index[iterrev]
1361 while iterrev != e[3] and iterrev != stoprev:
1362 chain.append(iterrev)
1363 if generaldelta:
1364 iterrev = e[3]
1365 else:
1366 iterrev -= 1
1367 e = index[iterrev]
1368
1369 if iterrev == stoprev:
1370 stopped = True
1371 else:
1372 chain.append(iterrev)
1373 stopped = False
1374
1375 chain.reverse()
1376 return chain, stopped
1377
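
Ignoring stoprev and the C fast path, the pure-Python walk above boils down to following base pointers until a self-referencing entry. A toy model, with a dict of rev -> base standing in for index[rev][3]:

def toydeltachain(base, rev):
    # follow base pointers (generaldelta-style) until the chain root,
    # which is an entry whose base is itself
    chain = []
    while base[rev] != rev:
        chain.append(rev)
        rev = base[rev]
    chain.append(rev)
    chain.reverse()
    return chain

base = {0: 0, 1: 0, 2: 1, 3: 3, 4: 3}
assert toydeltachain(base, 2) == [0, 1, 2]   # full chain down to a snapshot
assert toydeltachain(base, 4) == [3, 4]      # rev 3 is its own base (snapshot)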
1378 def ancestors(self, revs, stoprev=0, inclusive=False):
1379 """Generate the ancestors of 'revs' in reverse topological order.
1380 Does not generate revs lower than stoprev.
1381
1382 See the documentation for ancestor.lazyancestors for more details."""
1383
1384 return ancestor.lazyancestors(self.parentrevs, revs, stoprev=stoprev,
1385 inclusive=inclusive)
1386
1387 def descendants(self, revs):
1388 """Generate the descendants of 'revs' in revision order.
1389
1390 Yield a sequence of revision numbers starting with a child of
1391 some rev in revs, i.e., each revision is *not* considered a
1392 descendant of itself. Results are ordered by revision number (a
1393 topological sort)."""
1394 first = min(revs)
1395 if first == nullrev:
1396 for i in self:
1397 yield i
1398 return
1399
1400 seen = set(revs)
1401 for i in self.revs(start=first + 1):
1402 for x in self.parentrevs(i):
1403 if x != nullrev and x in seen:
1404 seen.add(i)
1405 yield i
1406 break
1407
1408 def findcommonmissing(self, common=None, heads=None):
1409 """Return a tuple of the ancestors of common and the ancestors of heads
1410 that are not ancestors of common. In revset terminology, we return the
1411 tuple:
1412
1413 ::common, (::heads) - (::common)
1414
1415 The list is sorted by revision number, meaning it is
1416 topologically sorted.
1417
1418 'heads' and 'common' are both lists of node IDs. If heads is
1419 not supplied, uses all of the revlog's heads. If common is not
1420 supplied, uses nullid."""
1421 if common is None:
1422 common = [nullid]
1423 if heads is None:
1424 heads = self.heads()
1425
1426 common = [self.rev(n) for n in common]
1427 heads = [self.rev(n) for n in heads]
1428
1429 # we want the ancestors, but inclusive
1430 class lazyset(object):
1431 def __init__(self, lazyvalues):
1432 self.addedvalues = set()
1433 self.lazyvalues = lazyvalues
1434
1435 def __contains__(self, value):
1436 return value in self.addedvalues or value in self.lazyvalues
1437
1438 def __iter__(self):
1439 added = self.addedvalues
1440 for r in added:
1441 yield r
1442 for r in self.lazyvalues:
1443 if r not in added:
1444 yield r
1445
1446 def add(self, value):
1447 self.addedvalues.add(value)
1448
1449 def update(self, values):
1450 self.addedvalues.update(values)
1451
1452 has = lazyset(self.ancestors(common))
1453 has.add(nullrev)
1454 has.update(common)
1455
1456 # take all ancestors from heads that aren't in has
1457 missing = set()
1458 visit = collections.deque(r for r in heads if r not in has)
1459 while visit:
1460 r = visit.popleft()
1461 if r in missing:
1462 continue
1463 else:
1464 missing.add(r)
1465 for p in self.parentrevs(r):
1466 if p not in has:
1467 visit.append(p)
1468 missing = list(missing)
1469 missing.sort()
1470 return has, [self.node(miss) for miss in missing]
1471
1472 def incrementalmissingrevs(self, common=None):
1473 """Return an object that can be used to incrementally compute the
1474 revision numbers of the ancestors of arbitrary sets that are not
1475 ancestors of common. This is an ancestor.incrementalmissingancestors
1476 object.
1477
1478 'common' is a list of revision numbers. If common is not supplied, uses
1479 nullrev.
1480 """
1481 if common is None:
1482 common = [nullrev]
1483
1484 return ancestor.incrementalmissingancestors(self.parentrevs, common)
1485
1486 def findmissingrevs(self, common=None, heads=None):
1487 """Return the revision numbers of the ancestors of heads that
1488 are not ancestors of common.
1489
1490 More specifically, return a list of revision numbers corresponding to
1491 nodes N such that every N satisfies the following constraints:
1492
1493 1. N is an ancestor of some node in 'heads'
1494 2. N is not an ancestor of any node in 'common'
1495
1496 The list is sorted by revision number, meaning it is
1497 topologically sorted.
1498
1499 'heads' and 'common' are both lists of revision numbers. If heads is
1500 not supplied, uses all of the revlog's heads. If common is not
1501 supplied, uses nullid."""
1502 if common is None:
1503 common = [nullrev]
1504 if heads is None:
1505 heads = self.headrevs()
1506
1507 inc = self.incrementalmissingrevs(common=common)
1508 return inc.missingancestors(heads)
1509
1510 def findmissing(self, common=None, heads=None):
1511 """Return the ancestors of heads that are not ancestors of common.
1512
1513 More specifically, return a list of nodes N such that every N
1514 satisfies the following constraints:
1515
1516 1. N is an ancestor of some node in 'heads'
1517 2. N is not an ancestor of any node in 'common'
1518
1519 The list is sorted by revision number, meaning it is
1520 topologically sorted.
1521
1522 'heads' and 'common' are both lists of node IDs. If heads is
1523 not supplied, uses all of the revlog's heads. If common is not
1524 supplied, uses nullid."""
1525 if common is None:
1526 common = [nullid]
1527 if heads is None:
1528 heads = self.heads()
1529
1530 common = [self.rev(n) for n in common]
1531 heads = [self.rev(n) for n in heads]
1532
1533 inc = self.incrementalmissingrevs(common=common)
1534 return [self.node(r) for r in inc.missingancestors(heads)]
1535
1536 def nodesbetween(self, roots=None, heads=None):
1537 """Return a topological path from 'roots' to 'heads'.
1538
1539 Return a tuple (nodes, outroots, outheads) where 'nodes' is a
1540 topologically sorted list of all nodes N that satisfy both of
1541 these constraints:
1542
1543 1. N is a descendant of some node in 'roots'
1544 2. N is an ancestor of some node in 'heads'
1545
1546 Every node is considered to be both a descendant and an ancestor
1547 of itself, so every reachable node in 'roots' and 'heads' will be
1548 included in 'nodes'.
1549
1550 'outroots' is the list of reachable nodes in 'roots', i.e., the
1551 subset of 'roots' that is returned in 'nodes'. Likewise,
1552 'outheads' is the subset of 'heads' that is also in 'nodes'.
1553
1554 'roots' and 'heads' are both lists of node IDs. If 'roots' is
1555 unspecified, uses nullid as the only root. If 'heads' is
1556 unspecified, uses list of all of the revlog's heads."""
1557 nonodes = ([], [], [])
1558 if roots is not None:
1559 roots = list(roots)
1560 if not roots:
1561 return nonodes
1562 lowestrev = min([self.rev(n) for n in roots])
1563 else:
1564 roots = [nullid] # Everybody's a descendant of nullid
1565 lowestrev = nullrev
1566 if (lowestrev == nullrev) and (heads is None):
1567 # We want _all_ the nodes!
1568 return ([self.node(r) for r in self], [nullid], list(self.heads()))
1569 if heads is None:
1570 # All nodes are ancestors, so the latest ancestor is the last
1571 # node.
1572 highestrev = len(self) - 1
1573 # Set ancestors to None to signal that every node is an ancestor.
1574 ancestors = None
1575 # Set heads to an empty dictionary for later discovery of heads
1576 heads = {}
1577 else:
1578 heads = list(heads)
1579 if not heads:
1580 return nonodes
1581 ancestors = set()
1582 # Turn heads into a dictionary so we can remove 'fake' heads.
1583 # Also, later we will be using it to filter out the heads we can't
1584 # find from roots.
1585 heads = dict.fromkeys(heads, False)
1586 # Start at the top and keep marking parents until we're done.
1587 nodestotag = set(heads)
1588 # Remember where the top was so we can use it as a limit later.
1589 highestrev = max([self.rev(n) for n in nodestotag])
1590 while nodestotag:
1591 # grab a node to tag
1592 n = nodestotag.pop()
1593 # Never tag nullid
1594 if n == nullid:
1595 continue
1596 # A node's revision number represents its place in a
1597 # topologically sorted list of nodes.
1598 r = self.rev(n)
1599 if r >= lowestrev:
1600 if n not in ancestors:
1601 # If we are possibly a descendant of one of the roots
1602 # and we haven't already been marked as an ancestor
1603 ancestors.add(n) # Mark as ancestor
1604 # Add non-nullid parents to list of nodes to tag.
1605 nodestotag.update([p for p in self.parents(n) if
1606 p != nullid])
1607 elif n in heads: # We've seen it before, is it a fake head?
1608 # So it is, real heads should not be the ancestors of
1609 # any other heads.
1610 heads.pop(n)
1611 if not ancestors:
1612 return nonodes
1613 # Now that we have our set of ancestors, we want to remove any
1614 # roots that are not ancestors.
1615
1616 # If one of the roots was nullid, everything is included anyway.
1617 if lowestrev > nullrev:
1618 # But, since we weren't, let's recompute the lowest rev to not
1619 # include roots that aren't ancestors.
1620
1621 # Filter out roots that aren't ancestors of heads
1622 roots = [root for root in roots if root in ancestors]
1623 # Recompute the lowest revision
1624 if roots:
1625 lowestrev = min([self.rev(root) for root in roots])
1626 else:
1627 # No more roots? Return empty list
1628 return nonodes
1629 else:
1630 # We are descending from nullid, and don't need to care about
1631 # any other roots.
1632 lowestrev = nullrev
1633 roots = [nullid]
1634 # Transform our roots list into a set.
1635 descendants = set(roots)
1636 # Also, keep the original roots so we can filter out roots that aren't
1637 # 'real' roots (i.e. are descended from other roots).
1638 roots = descendants.copy()
1639 # Our topologically sorted list of output nodes.
1640 orderedout = []
1641 # Don't start at nullid since we don't want nullid in our output list,
1642 # and if nullid shows up in descendants, empty parents will look like
1643 # they're descendants.
1644 for r in self.revs(start=max(lowestrev, 0), stop=highestrev + 1):
1645 n = self.node(r)
1646 isdescendant = False
1647 if lowestrev == nullrev: # Everybody is a descendant of nullid
1648 isdescendant = True
1649 elif n in descendants:
1650 # n is already a descendant
1651 isdescendant = True
1652 # This check only needs to be done here because all the roots
1653 # will start being marked as descendants before the loop.
1654 if n in roots:
1655 # If n was a root, check if it's a 'real' root.
1656 p = tuple(self.parents(n))
1657 # If any of its parents are descendants, it's not a root.
1658 if (p[0] in descendants) or (p[1] in descendants):
1659 roots.remove(n)
1660 else:
1661 p = tuple(self.parents(n))
1662 # A node is a descendant if either of its parents are
1663 # descendants. (We seeded the descendants set with the roots
1664 # up there, remember?)
1665 if (p[0] in descendants) or (p[1] in descendants):
1666 descendants.add(n)
1667 isdescendant = True
1668 if isdescendant and ((ancestors is None) or (n in ancestors)):
1669 # Only include nodes that are both descendants and ancestors.
1670 orderedout.append(n)
1671 if (ancestors is not None) and (n in heads):
1672 # We're trying to figure out which heads are reachable
1673 # from roots.
1674 # Mark this head as having been reached
1675 heads[n] = True
1676 elif ancestors is None:
1677 # Otherwise, we're trying to discover the heads.
1678 # Assume this is a head because if it isn't, the next step
1679 # will eventually remove it.
1680 heads[n] = True
1681 # But, obviously its parents aren't.
1682 for p in self.parents(n):
1683 heads.pop(p, None)
1684 heads = [head for head, flag in heads.iteritems() if flag]
1685 roots = list(roots)
1686 assert orderedout
1687 assert roots
1688 assert heads
1689 return (orderedout, roots, heads)
1690
1691 def headrevs(self):
1692 try:
1693 return self.index.headrevs()
1694 except AttributeError:
1695 return self._headrevs()
1696
1697 def computephases(self, roots):
1698 return self.index.computephasesmapsets(roots)
1699
1700 def _headrevs(self):
1701 count = len(self)
1702 if not count:
1703 return [nullrev]
1704 # we won't iterate over filtered revs, so nobody is a head at start
1705 ishead = [0] * (count + 1)
1706 index = self.index
1707 for r in self:
1708 ishead[r] = 1 # I may be a head
1709 e = index[r]
1710 ishead[e[5]] = ishead[e[6]] = 0 # my parents are not
1711 return [r for r, val in enumerate(ishead) if val]
1712
1713 def heads(self, start=None, stop=None):
1714 """return the list of all nodes that have no children
1715
1716 if start is specified, only heads that are descendants of
1717 start will be returned
1718 if stop is specified, it will consider all the revs from stop
1719 as if they had no children
1720 """
1721 if start is None and stop is None:
1722 if not len(self):
1723 return [nullid]
1724 return [self.node(r) for r in self.headrevs()]
1725
1726 if start is None:
1727 start = nullid
1728 if stop is None:
1729 stop = []
1730 stoprevs = set([self.rev(n) for n in stop])
1731 startrev = self.rev(start)
1732 reachable = {startrev}
1733 heads = {startrev}
1734
1735 parentrevs = self.parentrevs
1736 for r in self.revs(start=startrev + 1):
1737 for p in parentrevs(r):
1738 if p in reachable:
1739 if r not in stoprevs:
1740 reachable.add(r)
1741 heads.add(r)
1742 if p in heads and p not in stoprevs:
1743 heads.remove(p)
1744
1745 return [self.node(r) for r in heads]
1746
1747 def children(self, node):
1748 """find the children of a given node"""
1749 c = []
1750 p = self.rev(node)
1751 for r in self.revs(start=p + 1):
1752 prevs = [pr for pr in self.parentrevs(r) if pr != nullrev]
1753 if prevs:
1754 for pr in prevs:
1755 if pr == p:
1756 c.append(self.node(r))
1757 elif p == nullrev:
1758 c.append(self.node(r))
1759 return c
1760
1761 def commonancestorsheads(self, a, b):
1762 """calculate all the heads of the common ancestors of nodes a and b"""
1763 a, b = self.rev(a), self.rev(b)
1764 ancs = self._commonancestorsheads(a, b)
1765 return pycompat.maplist(self.node, ancs)
1766
1767 def _commonancestorsheads(self, *revs):
1768 """calculate all the heads of the common ancestors of revs"""
1769 try:
1770 ancs = self.index.commonancestorsheads(*revs)
1771 except (AttributeError, OverflowError): # C implementation failed
1772 ancs = ancestor.commonancestorsheads(self.parentrevs, *revs)
1773 return ancs
1774
1775 def isancestor(self, a, b):
1776 """return True if node a is an ancestor of node b
1777
1778 A revision is considered an ancestor of itself."""
1779 a, b = self.rev(a), self.rev(b)
1780 return self.isancestorrev(a, b)
1781
1782 def isancestorrev(self, a, b):
1783 """return True if revision a is an ancestor of revision b
1784
1785 A revision is considered an ancestor of itself.
1786
1787 The implementation of this is trivial but the use of
1788 commonancestorsheads is not."""
1789 if a == nullrev:
1790 return True
1791 elif a == b:
1792 return True
1793 elif a > b:
1794 return False
1795 return a in self._commonancestorsheads(a, b)
1796
1797 def ancestor(self, a, b):
1798 """calculate the "best" common ancestor of nodes a and b"""
1799
1800 a, b = self.rev(a), self.rev(b)
1801 try:
1802 ancs = self.index.ancestors(a, b)
1803 except (AttributeError, OverflowError):
1804 ancs = ancestor.ancestors(self.parentrevs, a, b)
1805 if ancs:
1806 # choose a consistent winner when there's a tie
1807 return min(map(self.node, ancs))
1808 return nullid
1809
1810 def _match(self, id):
1811 if isinstance(id, int):
1812 # rev
1813 return self.node(id)
1814 if len(id) == 20:
1815 # possibly a binary node
1816 # odds of a binary node being all hex in ASCII are 1 in 10**25
1817 try:
1818 node = id
1819 self.rev(node) # quick search the index
1820 return node
1821 except LookupError:
1822 pass # may be partial hex id
1823 try:
1824 # str(rev)
1825 rev = int(id)
1826 if "%d" % rev != id:
1827 raise ValueError
1828 if rev < 0:
1829 rev = len(self) + rev
1830 if rev < 0 or rev >= len(self):
1831 raise ValueError
1832 return self.node(rev)
1833 except (ValueError, OverflowError):
1834 pass
1835 if len(id) == 40:
1836 try:
1837 # a full hex nodeid?
1838 node = bin(id)
1839 self.rev(node)
1840 return node
1841 except (TypeError, LookupError):
1842 pass
1843
1844 def _partialmatch(self, id):
1845 # we don't care about wdirfilenodeids as they should always be full hashes
1846 maybewdir = wdirhex.startswith(id)
1847 try:
1848 partial = self.index.partialmatch(id)
1849 if partial and self.hasnode(partial):
1850 if maybewdir:
1851 # single 'ff...' match in radix tree, ambiguous with wdir
1852 raise RevlogError
1853 return partial
1854 if maybewdir:
1855 # no 'ff...' match in radix tree, wdir identified
1856 raise error.WdirUnsupported
1857 return None
1858 except RevlogError:
1859 # parsers.c radix tree lookup gave multiple matches
1860 # fast path: for unfiltered changelog, radix tree is accurate
1861 if not getattr(self, 'filteredrevs', None):
1862 raise AmbiguousPrefixLookupError(id, self.indexfile,
1863 _('ambiguous identifier'))
1864 # fall through to slow path that filters hidden revisions
1865 except (AttributeError, ValueError):
1866 # we are pure python, or key was too short to search radix tree
1867 pass
1868
1869 if id in self._pcache:
1870 return self._pcache[id]
1871
1872 if len(id) <= 40:
1873 try:
1874 # hex(node)[:...]
1875 l = len(id) // 2 # grab an even number of digits
1876 prefix = bin(id[:l * 2])
1877 nl = [e[7] for e in self.index if e[7].startswith(prefix)]
1878 nl = [n for n in nl if hex(n).startswith(id) and
1879 self.hasnode(n)]
1880 if nullhex.startswith(id):
1881 nl.append(nullid)
1882 if len(nl) > 0:
1883 if len(nl) == 1 and not maybewdir:
1884 self._pcache[id] = nl[0]
1885 return nl[0]
1886 raise AmbiguousPrefixLookupError(id, self.indexfile,
1887 _('ambiguous identifier'))
1888 if maybewdir:
1889 raise error.WdirUnsupported
1890 return None
1891 except TypeError:
1892 pass
1893
1894 def lookup(self, id):
1895 """locate a node based on:
1896 - revision number or str(revision number)
1897 - nodeid or subset of hex nodeid
1898 """
1899 n = self._match(id)
1900 if n is not None:
1901 return n
1902 n = self._partialmatch(id)
1903 if n:
1904 return n
1905
1906 raise LookupError(id, self.indexfile, _('no match found'))
1907
1908 def shortest(self, node, minlength=1):
1909 """Find the shortest unambiguous prefix that matches node."""
1910 def isvalid(prefix):
1911 try:
1912 node = self._partialmatch(prefix)
1913 except error.RevlogError:
1914 return False
1915 except error.WdirUnsupported:
1916 # single 'ff...' match
1917 return True
1918 if node is None:
1919 raise LookupError(node, self.indexfile, _('no node'))
1920 return True
1921
1922 def maybewdir(prefix):
1923 return all(c == 'f' for c in prefix)
1924
1925 hexnode = hex(node)
1926
1927 def disambiguate(hexnode, minlength):
1928 """Disambiguate against wdirid."""
1929 for length in range(minlength, 41):
1930 prefix = hexnode[:length]
1931 if not maybewdir(prefix):
1932 return prefix
1933
1934 if not getattr(self, 'filteredrevs', None):
1935 try:
1936 length = max(self.index.shortest(node), minlength)
1937 return disambiguate(hexnode, length)
1938 except RevlogError:
1939 if node != wdirid:
1940 raise LookupError(node, self.indexfile, _('no node'))
1941 except AttributeError:
1942 # Fall through to pure code
1943 pass
1944
1945 if node == wdirid:
1946 for length in range(minlength, 41):
1947 prefix = hexnode[:length]
1948 if isvalid(prefix):
1949 return prefix
1950
1951 for length in range(minlength, 41):
1952 prefix = hexnode[:length]
1953 if isvalid(prefix):
1954 return disambiguate(hexnode, length)
1955
1956 def cmp(self, node, text):
1957 """compare text with a given file revision
1958
1959 returns True if text is different than what is stored.
1960 """
1961 p1, p2 = self.parents(node)
1962 return hash(text, p1, p2) != node
1963
1964 def _cachesegment(self, offset, data):
1965 """Add a segment to the revlog cache.
1966
1967 Accepts an absolute offset and the data that is at that location.
1968 """
1969 o, d = self._chunkcache
1970 # try to add to existing cache
1971 if o + len(d) == offset and len(d) + len(data) < _chunksize:
1972 self._chunkcache = o, d + data
1973 else:
1974 self._chunkcache = offset, data
1975
1976 def _readsegment(self, offset, length, df=None):
1977 """Load a segment of raw data from the revlog.
1978
1979 Accepts an absolute offset, length to read, and an optional existing
1980 file handle to read from.
1981
1982 If an existing file handle is passed, it will be seeked and the
1983 original seek position will NOT be restored.
1984
1985 Returns a str or buffer of raw byte data.
1986 """
1987 # Cache data both forward and backward around the requested
1988 # data, in a fixed size window. This helps speed up operations
1989 # involving reading the revlog backwards.
1990 cachesize = self._chunkcachesize
1991 realoffset = offset & ~(cachesize - 1)
1992 reallength = (((offset + length + cachesize) & ~(cachesize - 1))
1993 - realoffset)
1994 with self._datareadfp(df) as df:
1995 df.seek(realoffset)
1996 d = df.read(reallength)
1997 self._cachesegment(realoffset, d)
1998 if offset != realoffset or reallength != length:
1999 return util.buffer(d, offset - realoffset, length)
2000 return d
2001
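
Because _chunkcachesize is enforced to be a power of two (see the constructor above), the masking here rounds the requested range out to cache-aligned boundaries. With the default 64KiB window:

cachesize = 65536
offset, length = 70000, 100
realoffset = offset & ~(cachesize - 1)
reallength = ((offset + length + cachesize) & ~(cachesize - 1)) - realoffset
assert realoffset == 65536                       # rounded down to window start
assert reallength == 65536                       # one full window is read
assert realoffset <= offset
assert offset + length <= realoffset + reallength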
2002 def _getsegment(self, offset, length, df=None):
2003 """Obtain a segment of raw data from the revlog.
2004
2005 Accepts an absolute offset, length of bytes to obtain, and an
2006 optional file handle to the already-opened revlog. If the file
2007 handle is used, its original seek position will not be preserved.
2008
2009 Requests for data may be returned from a cache.
2010
2011 Returns a str or a buffer instance of raw byte data.
2012 """
2013 o, d = self._chunkcache
2014 l = len(d)
2015
2016 # is it in the cache?
2017 cachestart = offset - o
2018 cacheend = cachestart + length
2019 if cachestart >= 0 and cacheend <= l:
2020 if cachestart == 0 and cacheend == l:
2021 return d # avoid a copy
2022 return util.buffer(d, cachestart, cacheend - cachestart)
2023
2024 return self._readsegment(offset, length, df=df)
2025
2026 def _getsegmentforrevs(self, startrev, endrev, df=None):
2027 """Obtain a segment of raw data corresponding to a range of revisions.
2028
2029 Accepts the start and end revisions and an optional already-open
2030 file handle to be used for reading. If the file handle is read, its
2031 seek position will not be preserved.
2032
2033 Requests for data may be satisfied by a cache.
2034
2035 Returns a 2-tuple of (offset, data) for the requested range of
2036 revisions. Offset is the integer offset from the beginning of the
2037 revlog and data is a str or buffer of the raw byte data.
2038
2039 Callers will need to call ``self.start(rev)`` and ``self.length(rev)``
2040 to determine where each revision's data begins and ends.
2041 """
2042 # Inlined self.start(startrev) & self.end(endrev) for perf reasons
2043 # (functions are expensive).
2044 index = self.index
2045 istart = index[startrev]
2046 start = int(istart[0] >> 16)
2047 if startrev == endrev:
2048 end = start + istart[1]
2049 else:
2050 iend = index[endrev]
2051 end = int(iend[0] >> 16) + iend[1]
2052
2053 if self._inline:
2054 start += (startrev + 1) * self._io.size
2055 end += (endrev + 1) * self._io.size
2056 length = end - start
2057
2058 return start, self._getsegment(start, length, df=df)
2059
2060 def _chunk(self, rev, df=None):
2061 """Obtain a single decompressed chunk for a revision.
2062
2063 Accepts an integer revision and an optional already-open file handle
2064 to be used for reading. If used, the seek position of the file will not
2065 be preserved.
2066
2067 Returns a str holding uncompressed data for the requested revision.
2068 """
2069 return self.decompress(self._getsegmentforrevs(rev, rev, df=df)[1])
2070
2071 def _chunks(self, revs, df=None, targetsize=None):
2072 """Obtain decompressed chunks for the specified revisions.
2073
2074 Accepts an iterable of numeric revisions that are assumed to be in
2075 ascending order. Also accepts an optional already-open file handle
2076 to be used for reading. If used, the seek position of the file will
2077 not be preserved.
2078
2079 This function is similar to calling ``self._chunk()`` multiple times,
2080 but is faster.
2081
2082 Returns a list with decompressed data for each requested revision.
2083 """
2084 if not revs:
2085 return []
2086 start = self.start
2087 length = self.length
2088 inline = self._inline
2089 iosize = self._io.size
2090 buffer = util.buffer
2091
2092 l = []
2093 ladd = l.append
2094
2095 if not self._withsparseread:
2096 slicedchunks = (revs,)
2097 else:
2098 slicedchunks = _slicechunk(self, revs, targetsize=targetsize)
2099
2100 for revschunk in slicedchunks:
2101 firstrev = revschunk[0]
2102 # Skip trailing revisions with empty diff
2103 for lastrev in revschunk[::-1]:
2104 if length(lastrev) != 0:
2105 break
2106
2107 try:
2108 offset, data = self._getsegmentforrevs(firstrev, lastrev, df=df)
2109 except OverflowError:
2110 # issue4215 - we can't cache a run of chunks greater than
2111 # 2G on Windows
2112 return [self._chunk(rev, df=df) for rev in revschunk]
2113
2114 decomp = self.decompress
2115 for rev in revschunk:
2116 chunkstart = start(rev)
2117 if inline:
2118 chunkstart += (rev + 1) * iosize
2119 chunklength = length(rev)
2120 ladd(decomp(buffer(data, chunkstart - offset, chunklength)))
2121
2122 return l
2123
2124 def _chunkclear(self):
2125 """Clear the raw chunk cache."""
2126 self._chunkcache = (0, '')
2127
2128 def deltaparent(self, rev):
2129 """return deltaparent of the given revision"""
2130 base = self.index[rev][3]
2131 if base == rev:
2132 return nullrev
2133 elif self._generaldelta:
2134 return base
2135 else:
2136 return rev - 1
2137
2138 def issnapshot(self, rev):
2139 """tells whether rev is a snapshot
2140 """
2141 if rev == nullrev:
2142 return True
2143 deltap = self.deltaparent(rev)
2144 if deltap == nullrev:
2145 return True
2146 p1, p2 = self.parentrevs(rev)
2147 if deltap in (p1, p2):
2148 return False
2149 return self.issnapshot(deltap)
2150
2151 def snapshotdepth(self, rev):
2152 """number of snapshots in the chain before this one"""
2153 if not self.issnapshot(rev):
2154 raise ProgrammingError('revision %d is not a snapshot' % rev)
2155 return len(self._deltachain(rev)[0]) - 1
2156
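
A toy model of the recursion above, with dicts standing in for deltaparent() and parentrevs() and -1 playing nullrev:

deltaparent = {0: -1, 1: 0, 2: 0}
parentrevs = {0: (-1, -1), 1: (0, -1), 2: (1, -1)}

def toyissnapshot(rev):
    if rev == -1:
        return True
    dp = deltaparent[rev]
    if dp == -1:
        return True                  # full snapshot (stored as fulltext)
    if dp in parentrevs[rev]:
        return False                 # plain delta against a parent
    return toyissnapshot(dp)         # intermediate snapshot if its base is one

assert toyissnapshot(0)              # stored as fulltext
assert not toyissnapshot(1)          # deltas against its parent
assert toyissnapshot(2)              # deltas against a non-parent snapshot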
2157 def revdiff(self, rev1, rev2):
2158 """return or calculate a delta between two revisions
2159
2160 The delta calculated is in binary form and is intended to be written to
2161 revlog data directly. So this function needs raw revision data.
2162 """
2163 if rev1 != nullrev and self.deltaparent(rev2) == rev1:
2164 return bytes(self._chunk(rev2))
2165
2166 return mdiff.textdiff(self.revision(rev1, raw=True),
2167 self.revision(rev2, raw=True))
2168
2169 def revision(self, nodeorrev, _df=None, raw=False):
2170 """return an uncompressed revision of a given node or revision
2171 number.
2172
2173 _df - an existing file handle to read from. (internal-only)
2174 raw - an optional argument specifying if the revision data is to be
2175 treated as raw data when applying flag transforms. 'raw' should be set
2176 to True when generating changegroups or in debug commands.
2177 """
2178 if isinstance(nodeorrev, int):
2179 rev = nodeorrev
2180 node = self.node(rev)
2181 else:
2182 node = nodeorrev
2183 rev = None
2184
2185 cachedrev = None
2186 flags = None
2187 rawtext = None
2188 if node == nullid:
2189 return ""
2190 if self._cache:
2191 if self._cache[0] == node:
2192 # _cache only stores rawtext
2193 if raw:
2194 return self._cache[2]
2195 # duplicated, but good for perf
2196 if rev is None:
2197 rev = self.rev(node)
2198 if flags is None:
2199 flags = self.flags(rev)
2200 # no extra flags set, no flag processor runs, text = rawtext
2201 if flags == REVIDX_DEFAULT_FLAGS:
2202 return self._cache[2]
2203 # rawtext is reusable. need to run flag processor
2204 rawtext = self._cache[2]
2205
2206 cachedrev = self._cache[1]
2207
2208 # look up what we need to read
2209 if rawtext is None:
2210 if rev is None:
2211 rev = self.rev(node)
2212
2213 chain, stopped = self._deltachain(rev, stoprev=cachedrev)
2214 if stopped:
2215 rawtext = self._cache[2]
2216
2217 # drop cache to save memory
2218 self._cache = None
2219
2220 targetsize = None
2221 rawsize = self.index[rev][2]
2222 if 0 <= rawsize:
2223 targetsize = 4 * rawsize
2224
2225 bins = self._chunks(chain, df=_df, targetsize=targetsize)
2226 if rawtext is None:
2227 rawtext = bytes(bins[0])
2228 bins = bins[1:]
2229
2230 rawtext = mdiff.patches(rawtext, bins)
2231 self._cache = (node, rev, rawtext)
2232
2233 if flags is None:
2234 if rev is None:
2235 rev = self.rev(node)
2236 flags = self.flags(rev)
2237
2238 text, validatehash = self._processflags(rawtext, flags, 'read', raw=raw)
2239 if validatehash:
2240 self.checkhash(text, node, rev=rev)
2241
2242 return text
2243
2244 def hash(self, text, p1, p2):
2245 """Compute a node hash.
2246
2247 Available as a function so that subclasses can replace the hash
2248 as needed.
2249 """
2250 return hash(text, p1, p2)
2251
2252 def _processflags(self, text, flags, operation, raw=False):
2253 """Inspect revision data flags and apply transforms defined by
2254 registered flag processors.
2255
2256 ``text`` - the revision data to process
2257 ``flags`` - the revision flags
2258 ``operation`` - the operation being performed (read or write)
2259 ``raw`` - an optional argument describing if the raw transform should be
2260 applied.
2261
2262 This method processes the flags in the order (or reverse order if
2263 ``operation`` is 'write') defined by REVIDX_FLAGS_ORDER, applying the
2264 flag processors registered for present flags. The order of flags defined
2265 in REVIDX_FLAGS_ORDER needs to be stable to allow non-commutativity.
2266
2267 Returns a 2-tuple of ``(text, validatehash)`` where ``text`` is the
2268 processed text and ``validatehash`` is a bool indicating whether the
2269 returned text should be checked for hash integrity.
2270
2271 Note: If the ``raw`` argument is set, it has precedence over the
2272 operation and will only update the value of ``validatehash``.
2273 """
2274 # fast path: no flag processors will run
2275 if flags == 0:
2276 return text, True
2277 if operation not in ('read', 'write'):
2278 raise ProgrammingError(_("invalid '%s' operation") % operation)
2279 # Check all flags are known.
2280 if flags & ~REVIDX_KNOWN_FLAGS:
2281 raise RevlogError(_("incompatible revision flag '%#x'") %
2282 (flags & ~REVIDX_KNOWN_FLAGS))
2283 validatehash = True
2284 # Depending on the operation (read or write), the order might be
2285 # reversed due to non-commutative transforms.
2286 orderedflags = REVIDX_FLAGS_ORDER
2287 if operation == 'write':
2288 orderedflags = reversed(orderedflags)
2289
2290 for flag in orderedflags:
2291 # If a flagprocessor has been registered for a known flag, apply the
2292 # related operation transform and update result tuple.
2293 if flag & flags:
2294 vhash = True
2295
2296 if flag not in _flagprocessors:
2297 message = _("missing processor for flag '%#x'") % (flag)
2298 raise RevlogError(message)
2299
2300 processor = _flagprocessors[flag]
2301 if processor is not None:
2302 readtransform, writetransform, rawtransform = processor
2303
2304 if raw:
2305 vhash = rawtransform(self, text)
2306 elif operation == 'read':
2307 text, vhash = readtransform(self, text)
2308 else: # write operation
2309 text, vhash = writetransform(self, text)
2310 validatehash = validatehash and vhash
2311
2312 return text, validatehash
2313
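
A flag processor is a (readtransform, writetransform, rawtransform) triple. As a hedged sketch only: the flag bit below is made up for illustration, and the registration call is assumed to be revlog.addflagprocessor or an equivalent hook rather than verified from this file:

import base64

def b64read(rl, text):
    # 'read': turn stored data back into the logical text
    return base64.b64decode(text), True

def b64write(rl, text):
    # 'write': turn the logical text into what gets stored
    return base64.b64encode(text), True

def b64raw(rl, text):
    # 'raw': the rawtext is hashable exactly as stored
    return True

REVIDX_HYPOTHETICAL_B64 = 1 << 13      # made-up flag bit, not a real one
processor = (b64read, b64write, b64raw)
# registration would then be something like (assumption):
# revlog.addflagprocessor(REVIDX_HYPOTHETICAL_B64, processor)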
2314 def checkhash(self, text, node, p1=None, p2=None, rev=None):
2315 """Check node hash integrity.
2316
2317 Available as a function so that subclasses can extend hash mismatch
2318 behaviors as needed.
2319 """
2320 try:
2321 if p1 is None and p2 is None:
2322 p1, p2 = self.parents(node)
2323 if node != self.hash(text, p1, p2):
2324 revornode = rev
2325 if revornode is None:
2326 revornode = templatefilters.short(hex(node))
2327 raise RevlogError(_("integrity check failed on %s:%s")
2328 % (self.indexfile, pycompat.bytestr(revornode)))
2329 except RevlogError:
2330 if self._censorable and _censoredtext(text):
2331 raise error.CensoredNodeError(self.indexfile, node, text)
2332 raise
2333
2334 def _enforceinlinesize(self, tr, fp=None):
2335 """Check if the revlog is too big for inline and convert if so.
2336
2337 This should be called after revisions are added to the revlog. If the
2338 revlog has grown too large to be an inline revlog, it will convert it
2339 to use multiple index and data files.
2340 """
2341 tiprev = len(self) - 1
2342 if (not self._inline or
2343 (self.start(tiprev) + self.length(tiprev)) < _maxinline):
2344 return
2345
2346 trinfo = tr.find(self.indexfile)
2347 if trinfo is None:
2348 raise RevlogError(_("%s not found in the transaction")
2349 % self.indexfile)
2350
2351 trindex = trinfo[2]
2352 if trindex is not None:
2353 dataoff = self.start(trindex)
2354 else:
2355 # revlog was stripped at start of transaction, use all leftover data
2356 trindex = len(self) - 1
2357 dataoff = self.end(tiprev)
2358
2359 tr.add(self.datafile, dataoff)
2360
2361 if fp:
2362 fp.flush()
2363 fp.close()
2364
2365 with self._datafp('w') as df:
2366 for r in self:
2367 df.write(self._getsegmentforrevs(r, r)[1])
2368
2369 with self._indexfp('w') as fp:
2370 self.version &= ~FLAG_INLINE_DATA
2371 self._inline = False
2372 io = self._io
2373 for i in self:
2374 e = io.packentry(self.index[i], self.node, self.version, i)
2375 fp.write(e)
2376
2377 # the temp file replaces the real index when we exit the context
2378 # manager
2379
2380 tr.replace(self.indexfile, trindex * self._io.size)
2381 self._chunkclear()
2382
2383 def addrevision(self, text, transaction, link, p1, p2, cachedelta=None,
2384 node=None, flags=REVIDX_DEFAULT_FLAGS, deltacomputer=None):
2385 """add a revision to the log
2386
2387 text - the revision data to add
2388 transaction - the transaction object used for rollback
2389 link - the linkrev data to add
2390 p1, p2 - the parent nodeids of the revision
2391 cachedelta - an optional precomputed delta
2392 node - nodeid of revision; typically node is not specified, and it is
2393 computed by default as hash(text, p1, p2), however subclasses might
2394 use different hashing method (and override checkhash() in such case)
2395 flags - the known flags to set on the revision
2396 deltacomputer - an optional _deltacomputer instance shared between
2397 multiple calls
2398 """
2399 if link == nullrev:
2400 raise RevlogError(_("attempted to add linkrev -1 to %s")
2401 % self.indexfile)
2402
2403 if flags:
2404 node = node or self.hash(text, p1, p2)
2405
2406 rawtext, validatehash = self._processflags(text, flags, 'write')
2407
2408 # If the flag processor modifies the revision data, ignore any provided
2409 # cachedelta.
2410 if rawtext != text:
2411 cachedelta = None
2412
2413 if len(rawtext) > _maxentrysize:
2414 raise RevlogError(
2415 _("%s: size of %d bytes exceeds maximum revlog storage of 2GiB")
2416 % (self.indexfile, len(rawtext)))
2417
2418 node = node or self.hash(rawtext, p1, p2)
2419 if node in self.nodemap:
2420 return node
2421
2422 if validatehash:
2423 self.checkhash(rawtext, node, p1=p1, p2=p2)
2424
2425 return self.addrawrevision(rawtext, transaction, link, p1, p2, node,
2426 flags, cachedelta=cachedelta,
2427 deltacomputer=deltacomputer)
2428
2429 def addrawrevision(self, rawtext, transaction, link, p1, p2, node, flags,
2430 cachedelta=None, deltacomputer=None):
2431 """add a raw revision with known flags, node and parents
2432 useful when reusing a revision not stored in this revlog (ex: received
2433 over wire, or read from an external bundle).
2434 """
2435 dfh = None
2436 if not self._inline:
2437 dfh = self._datafp("a+")
2438 ifh = self._indexfp("a+")
2439 try:
2440 return self._addrevision(node, rawtext, transaction, link, p1, p2,
2441 flags, cachedelta, ifh, dfh,
2442 deltacomputer=deltacomputer)
2443 finally:
2444 if dfh:
2445 dfh.close()
2446 ifh.close()
2447
2448 def compress(self, data):
2449 """Generate a possibly-compressed representation of data."""
2450 if not data:
2451 return '', data
2452
2453 compressed = self._compressor.compress(data)
2454
2455 if compressed:
2456 # The revlog compressor added the header in the returned data.
2457 return '', compressed
2458
2459 if data[0:1] == '\0':
2460 return '', data
2461 return 'u', data
2462
2463 def decompress(self, data):
2464 """Decompress a revlog chunk.
2465
2466 The chunk is expected to begin with a header identifying the
2467 format type so it can be routed to an appropriate decompressor.
2468 """
2469 if not data:
2470 return data
2471
2472 # Revlogs are read much more frequently than they are written and many
2473 # chunks only take microseconds to decompress, so performance is
2474 # important here.
2475 #
2476 # We can make a few assumptions about revlogs:
2477 #
2478 # 1) the majority of chunks will be compressed (as opposed to inline
2479 # raw data).
2480 # 2) decompressing *any* data will likely be at least 10x slower than
2481 # returning raw inline data.
2482 # 3) we want to prioritize common and officially supported compression
2483 # engines
2484 #
2485 # It follows that we want to optimize for "decompress compressed data
2486 # when encoded with common and officially supported compression engines"
2487 # case over "raw data" and "data encoded by less common or non-official
2488 # compression engines." That is why we have the inline lookup first
2489 # followed by the compengines lookup.
2490 #
2491 # According to `hg perfrevlogchunks`, this is ~0.5% faster for zlib
2492 # compressed chunks. And this matters for changelog and manifest reads.
        t = data[0:1]

        if t == 'x':
            try:
                return _zlibdecompress(data)
            except zlib.error as e:
                raise RevlogError(_('revlog decompress error: %s') %
                                  stringutil.forcebytestr(e))
        # '\0' is more common than 'u' so it goes first.
        elif t == '\0':
            return data
        elif t == 'u':
            return util.buffer(data, 1)

        try:
            compressor = self._decompressors[t]
        except KeyError:
            try:
                engine = util.compengines.forrevlogheader(t)
                compressor = engine.revlogcompressor()
                self._decompressors[t] = compressor
            except KeyError:
                raise RevlogError(_('unknown compression type %r') % t)

        return compressor.decompress(data)

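And the matching decode side, a self-contained sketch (ours) of the header dispatch performed above, with zlib standing in for the built-in 'x' engine and a plain dict in place of the per-revlog decompressor cache:

import zlib

_toy_decompressors = {}                # header byte -> decompress callable

def toy_decompress(data):
    if not data:
        return data
    t = data[0:1]
    if t == b'x':
        return zlib.decompress(data)   # zlib streams begin with 'x'
    if t == b'\0':
        return data                    # literal chunk starting with NUL
    if t == b'u':
        return data[1:]                # strip the "uncompressed" marker
    try:
        return _toy_decompressors[t](data)
    except KeyError:
        raise KeyError('unknown compression type %r' % t)

assert toy_decompress(b'uabc') == b'abc'
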
    def _isgooddeltainfo(self, deltainfo, revinfo):
        """Returns True if the given delta is good. Good means that it is within
        the disk span, disk size, and chain length bounds that we know to be
        performant."""
        if deltainfo is None:
            return False

        # - 'deltainfo.distance' is the distance from the base revision --
        #   bounding it limits the amount of I/O we need to do.
        # - 'deltainfo.compresseddeltalen' is the sum of the total size of
        #   deltas we need to apply -- bounding it limits the amount of CPU
        #   we consume.

        if self._sparserevlog:
            # As sparse-read will be used, we can consider that the distance,
            # instead of being the span of the whole chunk,
            # is the span of the largest read chunk
            base = deltainfo.base

            if base != nullrev:
                deltachain = self._deltachain(base)[0]
            else:
                deltachain = []

            # search for the first non-snapshot revision
            for idx, r in enumerate(deltachain):
                if not self.issnapshot(r):
                    break
            deltachain = deltachain[idx:]
            chunks = _slicechunk(self, deltachain, deltainfo)
            all_span = [_segmentspan(self, revs, deltainfo) for revs in chunks]
            distance = max(all_span)
        else:
            distance = deltainfo.distance

        textlen = revinfo.textlen
        defaultmax = textlen * 4
        maxdist = self._maxdeltachainspan
        if not maxdist:
            maxdist = distance # ensure the conditional passes
        maxdist = max(maxdist, defaultmax)
        if self._sparserevlog and maxdist < self._srmingapsize:
            # In multiple places, we ignore irrelevant data ranges below a
            # certain size. We also apply this tradeoff here and relax the
            # span constraint for small enough content.
            maxdist = self._srmingapsize

        # Bad delta from read span:
        #
        #   If the span of data read is larger than the maximum allowed.
        if maxdist < distance:
            return False

        # Bad delta from new delta size:
        #
        #   If the delta size is larger than the target text, storing the
        #   delta will be inefficient.
        if textlen < deltainfo.deltalen:
            return False

        # Bad delta from cumulated payload size:
        #
        #   If the sum of the deltas gets larger than K * target text length.
        if textlen * LIMIT_DELTA2TEXT < deltainfo.compresseddeltalen:
            return False

        # Bad delta from chain length:
        #
        #   If the number of deltas in the chain gets too high.
        if self._maxchainlen and self._maxchainlen < deltainfo.chainlen:
            return False

        # bad delta from intermediate snapshot size limit
        #
        #   If an intermediate snapshot's size exceeds its limit. The limit
        #   exists to prevent endless chains of intermediate deltas from
        #   being created.
        if (deltainfo.snapshotdepth is not None and
            (textlen >> deltainfo.snapshotdepth) < deltainfo.deltalen):
            return False

        # bad delta if new intermediate snapshot is larger than the previous
        # snapshot
        if (deltainfo.snapshotdepth
            and self.length(deltainfo.base) < deltainfo.deltalen):
            return False

        return True

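A tiny worked example with hypothetical numbers may help ground the two most common bounds above (plain Python, independent of any revlog instance):

textlen = 1000                        # size of the revision being stored
distance = 4200                       # bytes read to apply the delta chain
maxdist = max(distance, 4 * textlen)  # span cap when _maxdeltachainspan is unset
print(maxdist < distance)             # False: the read-span check passes
deltalen = 1200                       # size of the candidate delta
print(textlen < deltalen)             # True: delta larger than the text, rejected
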
    def _addrevision(self, node, rawtext, transaction, link, p1, p2, flags,
                     cachedelta, ifh, dfh, alwayscache=False,
                     deltacomputer=None):
        """internal function to add revisions to the log

        see addrevision for argument descriptions.

        note: "addrevision" takes non-raw text, "_addrevision" takes raw text.

        if "deltacomputer" is not provided or None, a defaultdeltacomputer will
        be used.

        invariants:
        - rawtext is optional (can be None); if not set, cachedelta must be set.
          if both are set, they must correspond to each other.
        """
        if node == nullid:
            raise RevlogError(_("%s: attempt to add null revision") %
                              (self.indexfile))
        if node == wdirid or node in wdirfilenodeids:
            raise RevlogError(_("%s: attempt to add wdir revision") %
                              (self.indexfile))

        if self._inline:
            fh = ifh
        else:
            fh = dfh

        btext = [rawtext]

        curr = len(self)
        prev = curr - 1
        offset = self.end(prev)
        p1r, p2r = self.rev(p1), self.rev(p2)

        # full versions are inserted when the needed deltas
        # become comparable to the uncompressed text
        if rawtext is None:
            # need rawtext size, before changed by flag processors, which is
            # the non-raw size. use revlog explicitly to avoid filelog's extra
            # logic that might remove metadata size.
            textlen = mdiff.patchedsize(revlog.size(self, cachedelta[0]),
                                        cachedelta[1])
        else:
            textlen = len(rawtext)

        if deltacomputer is None:
            deltacomputer = _deltacomputer(self)

        revinfo = _revisioninfo(node, p1, p2, btext, textlen, cachedelta, flags)

        # no delta for flag processor revision (see "candelta" for why)
        # not calling candelta since only one revision needs test, also to
        # avoid overhead fetching flags again.
        if flags & REVIDX_RAWTEXT_CHANGING_FLAGS:
            deltainfo = None
        else:
            deltainfo = deltacomputer.finddeltainfo(revinfo, fh)

        if deltainfo is not None:
            base = deltainfo.base
            chainbase = deltainfo.chainbase
            data = deltainfo.data
            l = deltainfo.deltalen
        else:
            rawtext = deltacomputer.buildtext(revinfo, fh)
            data = self.compress(rawtext)
            l = len(data[1]) + len(data[0])
            base = chainbase = curr

        e = (offset_type(offset, flags), l, textlen,
             base, link, p1r, p2r, node)
        self.index.append(e)
        self.nodemap[node] = curr

        entry = self._io.packentry(e, self.node, self.version, curr)
        self._writeentry(transaction, ifh, dfh, entry, data, link, offset)

        if alwayscache and rawtext is None:
            rawtext = deltacomputer.buildtext(revinfo, fh)

        if type(rawtext) == bytes: # only accept immutable objects
            self._cache = (node, curr, rawtext)
        self._chainbasecache[curr] = chainbase
        return node

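For reference, the first field of the index entry ``e`` built above packs the data offset and the REVIDX_* flags into a single integer. A sketch mirroring revlog's offset_type() helper (the unpacking helpers are ours):

def toy_offset_type(offset, flags):
    # high bits carry the byte offset, the low 16 bits carry the flags
    return int(offset) << 16 | flags

def toy_getoffset(field):
    return field >> 16

def toy_getflags(field):
    return field & 0xFFFF

assert toy_getoffset(toy_offset_type(1024, 1)) == 1024
assert toy_getflags(toy_offset_type(1024, 1)) == 1
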
    def _writeentry(self, transaction, ifh, dfh, entry, data, link, offset):
        # Files opened in a+ mode have inconsistent behavior on various
        # platforms. Windows requires that a file positioning call be made
        # when the file handle transitions between reads and writes. See
        # 3686fa2b8eee and the mixedfilemodewrapper in windows.py. On other
        # platforms, Python or the platform itself can be buggy. Some versions
        # of Solaris have been observed to not append at the end of the file
        # if the file was seeked to before the end. See issue4943 for more.
        #
        # We work around this issue by inserting a seek() before writing.
        # Note: This is likely not necessary on Python 3.
        ifh.seek(0, os.SEEK_END)
        if dfh:
            dfh.seek(0, os.SEEK_END)

        curr = len(self) - 1
        if not self._inline:
            transaction.add(self.datafile, offset)
            transaction.add(self.indexfile, curr * len(entry))
            if data[0]:
                dfh.write(data[0])
            dfh.write(data[1])
            ifh.write(entry)
        else:
            offset += curr * self._io.size
            transaction.add(self.indexfile, offset, curr)
            ifh.write(entry)
            ifh.write(data[0])
            ifh.write(data[1])
            self._enforceinlinesize(transaction, ifh)

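The seek-before-write workaround is easy to demonstrate in isolation; a minimal standalone snippet (hypothetical file name, safe to run anywhere):

import os

with open('toy.dat', 'a+b') as fh:
    fh.seek(0)
    fh.read()                    # reading moves the file position...
    fh.seek(0, os.SEEK_END)      # ...so reposition to EOF before writing,
    fh.write(b'appended chunk')  # as some platforms will not do it for us
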
    def addgroup(self, deltas, linkmapper, transaction, addrevisioncb=None):
        """
        add a delta group

        given a set of deltas, add them to the revision log. the
        first delta is against its parent, which should be in our
        log, the rest are against the previous delta.

        If ``addrevisioncb`` is defined, it will be called with arguments of
        this revlog and the node that was added.
        """

        nodes = []

        r = len(self)
        end = 0
        if r:
            end = self.end(r - 1)
        ifh = self._indexfp("a+")
        isize = r * self._io.size
        if self._inline:
            transaction.add(self.indexfile, end + isize, r)
            dfh = None
        else:
            transaction.add(self.indexfile, isize, r)
            transaction.add(self.datafile, end)
            dfh = self._datafp("a+")
        def flush():
            if dfh:
                dfh.flush()
            ifh.flush()
        try:
            deltacomputer = _deltacomputer(self)
            # loop through our set of deltas
            for data in deltas:
                node, p1, p2, linknode, deltabase, delta, flags = data
                link = linkmapper(linknode)
                flags = flags or REVIDX_DEFAULT_FLAGS

                nodes.append(node)

                if node in self.nodemap:
                    # this can happen if two branches make the same change
                    continue

                for p in (p1, p2):
                    if p not in self.nodemap:
                        raise LookupError(p, self.indexfile,
                                          _('unknown parent'))

                if deltabase not in self.nodemap:
                    raise LookupError(deltabase, self.indexfile,
                                      _('unknown delta base'))

                baserev = self.rev(deltabase)

                if baserev != nullrev and self.iscensored(baserev):
                    # if base is censored, delta must be full replacement in a
                    # single patch operation
                    hlen = struct.calcsize(">lll")
                    oldlen = self.rawsize(baserev)
                    newlen = len(delta) - hlen
                    if delta[:hlen] != mdiff.replacediffheader(oldlen, newlen):
                        raise error.CensoredBaseError(self.indexfile,
                                                      self.node(baserev))

                if not flags and self._peek_iscensored(baserev, delta, flush):
                    flags |= REVIDX_ISCENSORED

                # We assume consumers of addrevisioncb will want to retrieve
                # the added revision, which will require a call to
                # revision(). revision() will fast path if there is a cache
                # hit. So, we tell _addrevision() to always cache in this case.
                # We're only using addgroup() in the context of changegroup
                # generation so the revision data can always be handled as raw
                # by the flagprocessor.
                self._addrevision(node, None, transaction, link,
                                  p1, p2, flags, (baserev, delta),
                                  ifh, dfh,
                                  alwayscache=bool(addrevisioncb),
                                  deltacomputer=deltacomputer)

                if addrevisioncb:
                    addrevisioncb(self, node)

                if not dfh and not self._inline:
                    # addrevision switched from inline to conventional
                    # reopen the index
                    ifh.close()
                    dfh = self._datafp("a+")
                    ifh = self._indexfp("a+")
        finally:
            if dfh:
                dfh.close()
            ifh.close()

        return nodes

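For orientation, each element of the ``deltas`` iterable consumed above unpacks as follows (field descriptions are ours, inferred from the loop body):

# node       hash of the revision being added
# p1, p2     parent nodes; each must already be in this revlog
# linknode   node passed to ``linkmapper`` to obtain the linkrev
# deltabase  node the binary delta applies against
# delta      the binary delta itself
# flags      REVIDX_* flags; a falsy value means REVIDX_DEFAULT_FLAGS
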
    def iscensored(self, rev):
        """Check if a file revision is censored."""
        if not self._censorable:
            return False

        return self.flags(rev) & REVIDX_ISCENSORED

    def _peek_iscensored(self, baserev, delta, flush):
        """Quickly check if a delta produces a censored revision."""
        if not self._censorable:
            return False

        # Fragile heuristic: unless new file meta keys are added alphabetically
        # preceding "censored", all censored revisions are prefixed by
        # "\1\ncensored:". A delta producing such a censored revision must be a
        # full-replacement delta, so we inspect the first and only patch in the
        # delta for this prefix.
        hlen = struct.calcsize(">lll")
        if len(delta) <= hlen:
            return False

        oldlen = self.rawsize(baserev)
        newlen = len(delta) - hlen
        if delta[:hlen] != mdiff.replacediffheader(oldlen, newlen):
            return False

        add = "\1\ncensored:"
        addlen = len(add)
        return newlen >= addlen and delta[hlen:hlen + addlen] == add

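To make the header comparison concrete: a full-replacement delta is a single patch op whose 12-byte ">lll" header says "replace bytes [0, oldlen) with newlen new bytes". A sketch (our helper, intended to match what mdiff.replacediffheader() produces):

import struct

def toy_replacediffheader(oldlen, newlen):
    # one patch op: start=0, end=oldlen, length of replacement data=newlen
    return struct.pack(">lll", 0, oldlen, newlen)

hlen = struct.calcsize(">lll")
assert hlen == 12
assert len(toy_replacediffheader(120, 140)) == hlen
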
    def getstrippoint(self, minlink):
        """find the minimum rev that must be stripped to strip the linkrev

        Returns a tuple containing the minimum rev and a set of all revs that
        have linkrevs that will be broken by this strip.
        """
        brokenrevs = set()
        strippoint = len(self)

        heads = {}
        futurelargelinkrevs = set()
        for head in self.headrevs():
            headlinkrev = self.linkrev(head)
            heads[head] = headlinkrev
            if headlinkrev >= minlink:
                futurelargelinkrevs.add(headlinkrev)

        # This algorithm involves walking down the rev graph, starting at the
        # heads. Since the revs are topologically sorted according to linkrev,
        # once all head linkrevs are below the minlink, we know there are
        # no more revs that could have a linkrev greater than minlink.
        # So we can stop walking.
        while futurelargelinkrevs:
            strippoint -= 1
            linkrev = heads.pop(strippoint)

            if linkrev < minlink:
                brokenrevs.add(strippoint)
            else:
                futurelargelinkrevs.remove(linkrev)

            for p in self.parentrevs(strippoint):
                if p != nullrev:
                    plinkrev = self.linkrev(p)
                    heads[p] = plinkrev
                    if plinkrev >= minlink:
                        futurelargelinkrevs.add(plinkrev)

        return strippoint, brokenrevs

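A worked example (hypothetical, linear history): with five revisions whose linkrevs are [0, 1, 2, 3, 4] and minlink=3, the walk pops rev 4 (linkrev 4) and rev 3 (linkrev 3); at that point no reachable head has a linkrev >= 3, so it returns (3, set()): truncate at rev 3, nothing broken. brokenrevs only fills up when linkrevs are not monotonic, i.e. when a rev above the eventual strip point carries a linkrev below minlink.
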
    def strip(self, minlink, transaction):
        """truncate the revlog on the first revision with a linkrev >= minlink

        This function is called when we're stripping revision minlink and
        its descendants from the repository.

        We have to remove all revisions with linkrev >= minlink, because
        the equivalent changelog revisions will be renumbered after the
        strip.

        So we truncate the revlog on the first of these revisions, and
        trust that the caller has saved the revisions that shouldn't be
        removed and that it'll re-add them after this truncation.
        """
        if len(self) == 0:
            return

        rev, _ = self.getstrippoint(minlink)
        if rev == len(self):
            return

        # first truncate the files on disk
        end = self.start(rev)
        if not self._inline:
            transaction.add(self.datafile, end)
            end = rev * self._io.size
        else:
            end += rev * self._io.size

        transaction.add(self.indexfile, end)

        # then reset internal state in memory to forget those revisions
        self._cache = None
        self._chaininfocache = {}
        self._chunkclear()
        for x in pycompat.xrange(rev, len(self)):
            del self.nodemap[self.node(x)]

        del self.index[rev:-1]
        self._nodepos = None

    def checksize(self):
        expected = 0
        if len(self):
            expected = max(0, self.end(len(self) - 1))

        try:
            with self._datafp() as f:
                f.seek(0, 2)
                actual = f.tell()
            dd = actual - expected
        except IOError as inst:
            if inst.errno != errno.ENOENT:
                raise
            dd = 0

        try:
            f = self.opener(self.indexfile)
            f.seek(0, 2)
            actual = f.tell()
            f.close()
            s = self._io.size
            i = max(0, actual // s)
            di = actual - (i * s)
            if self._inline:
                databytes = 0
                for r in self:
                    databytes += max(0, self.length(r))
                dd = 0
                di = actual - len(self) * s - databytes
        except IOError as inst:
            if inst.errno != errno.ENOENT:
                raise
            di = 0

        return (dd, di)

    def files(self):
        res = [self.indexfile]
        if not self._inline:
            res.append(self.datafile)
        return res

    def emitrevisiondeltas(self, requests):
        frev = self.rev

        prevrev = None
        for request in requests:
            node = request.node
            rev = frev(node)

            if prevrev is None:
                prevrev = self.index[rev][5]

            # Requesting a full revision.
            if request.basenode == nullid:
                baserev = nullrev
            # Requesting an explicit revision.
            elif request.basenode is not None:
                baserev = frev(request.basenode)
            # Allowing us to choose.
            else:
                p1rev, p2rev = self.parentrevs(rev)
                deltaparentrev = self.deltaparent(rev)

                # Avoid sending full revisions when delta parent is null. Pick
                # prev in that case. It's tempting to pick p1 in this case, as
                # p1 will be smaller in the common case. However, computing a
                # delta against p1 may require resolving the raw text of p1,
                # which could be expensive. The revlog caches should have prev
                # cached, meaning less CPU for delta generation. There is
                # likely room to add a flag and/or config option to control
                # this behavior.
                if deltaparentrev == nullrev and self._storedeltachains:
                    baserev = prevrev

                # Revlog is configured to use full snapshot for a reason.
                # Stick to full snapshot.
                elif deltaparentrev == nullrev:
                    baserev = nullrev

                # Pick previous when we can't be sure the base is available
                # on consumer.
                elif deltaparentrev not in (p1rev, p2rev, prevrev):
                    baserev = prevrev
                else:
                    baserev = deltaparentrev

                if baserev != nullrev and not self.candelta(baserev, rev):
                    baserev = nullrev

            revision = None
            delta = None
            baserevisionsize = None

            if self.iscensored(baserev) or self.iscensored(rev):
                try:
                    revision = self.revision(node, raw=True)
                except error.CensoredNodeError as e:
                    revision = e.tombstone

                if baserev != nullrev:
                    baserevisionsize = self.rawsize(baserev)

            elif baserev == nullrev:
                revision = self.revision(node, raw=True)
            else:
                delta = self.revdiff(baserev, rev)

            extraflags = REVIDX_ELLIPSIS if request.ellipsis else 0

            yield revlogrevisiondelta(
                node=node,
                p1node=request.p1node,
                p2node=request.p2node,
                linknode=request.linknode,
                basenode=self.node(baserev),
                flags=self.flags(rev) | extraflags,
                baserevisionsize=baserevisionsize,
                revision=revision,
                delta=delta)

            prevrev = rev

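Distilled from the "allowing us to choose" branch above, a standalone sketch (ours) of the base-selection priority, which makes the ordering easier to audit:

nullrev = -1

def toy_choosebase(deltaparentrev, p1rev, p2rev, prevrev, storedeltachains):
    if deltaparentrev == nullrev and storedeltachains:
        return prevrev         # avoid a full text; prev is likely cached
    if deltaparentrev == nullrev:
        return nullrev         # revlog insists on full snapshots; keep them
    if deltaparentrev not in (p1rev, p2rev, prevrev):
        return prevrev         # the stored base may be absent on the consumer
    return deltaparentrev      # stored delta parent is safe to reuse
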
    DELTAREUSEALWAYS = 'always'
    DELTAREUSESAMEREVS = 'samerevs'
    DELTAREUSENEVER = 'never'

    DELTAREUSEFULLADD = 'fulladd'

    DELTAREUSEALL = {'always', 'samerevs', 'never', 'fulladd'}

    def clone(self, tr, destrevlog, addrevisioncb=None,
              deltareuse=DELTAREUSESAMEREVS, deltabothparents=None):
        """Copy this revlog to another, possibly with format changes.

        The destination revlog will contain the same revisions and nodes.
        However, it may not be bit-for-bit identical due to e.g. delta encoding
        differences.

        The ``deltareuse`` argument controls how deltas from the existing
        revlog are preserved in the destination revlog. The argument can have
        the following values:

        DELTAREUSEALWAYS
           Deltas will always be reused (if possible), even if the destination
           revlog would not select the same revisions for the delta. This is
           the fastest mode of operation.
        DELTAREUSESAMEREVS
           Deltas will be reused if the destination revlog would pick the same
           revisions for the delta. This mode strikes a balance between speed
           and optimization.
        DELTAREUSENEVER
           Deltas will never be reused. This is the slowest mode of execution.
           This mode can be used to recompute deltas (e.g. if the diff/delta
           algorithm changes).

        Delta computation can be slow, so the choice of delta reuse policy can
        significantly affect run time.

        The default policy (``DELTAREUSESAMEREVS``) strikes a balance between
        the two extremes. Deltas will be reused when they are appropriate. But
        if a better delta base could be chosen for a revision, it will be.
        This means that if you are converting a non-generaldelta revlog to a
        generaldelta revlog, deltas will be recomputed if the delta's parent
        isn't a parent of the revision.

        In addition to the delta policy, the ``deltabothparents`` argument
        controls whether to compute deltas against both parents for merges.
        When unset, the destination revlog's existing setting is used.
        """
        if deltareuse not in self.DELTAREUSEALL:
            raise ValueError(_('value for deltareuse invalid: %s') % deltareuse)

        if len(destrevlog):
            raise ValueError(_('destination revlog is not empty'))

        if getattr(self, 'filteredrevs', None):
            raise ValueError(_('source revlog has filtered revisions'))
        if getattr(destrevlog, 'filteredrevs', None):
            raise ValueError(_('destination revlog has filtered revisions'))

        # lazydeltabase controls whether to reuse a cached delta, if possible.
        oldlazydeltabase = destrevlog._lazydeltabase
        oldamd = destrevlog._deltabothparents

        try:
            if deltareuse == self.DELTAREUSEALWAYS:
                destrevlog._lazydeltabase = True
            elif deltareuse == self.DELTAREUSESAMEREVS:
                destrevlog._lazydeltabase = False

            destrevlog._deltabothparents = deltabothparents or oldamd

            populatecachedelta = deltareuse in (self.DELTAREUSEALWAYS,
                                                self.DELTAREUSESAMEREVS)

            deltacomputer = _deltacomputer(destrevlog)
            index = self.index
            for rev in self:
                entry = index[rev]

                # Some classes override linkrev to take filtered revs into
                # account. Use raw entry from index.
                flags = entry[0] & 0xffff
                linkrev = entry[4]
                p1 = index[entry[5]][7]
                p2 = index[entry[6]][7]
                node = entry[7]

                # (Possibly) reuse the delta from the revlog if allowed and
                # the revlog chunk is a delta.
                cachedelta = None
                rawtext = None
                if populatecachedelta:
                    dp = self.deltaparent(rev)
                    if dp != nullrev:
                        cachedelta = (dp, bytes(self._chunk(rev)))

                if not cachedelta:
                    rawtext = self.revision(rev, raw=True)

                if deltareuse == self.DELTAREUSEFULLADD:
                    destrevlog.addrevision(rawtext, tr, linkrev, p1, p2,
                                           cachedelta=cachedelta,
                                           node=node, flags=flags,
                                           deltacomputer=deltacomputer)
                else:
                    ifh = destrevlog.opener(destrevlog.indexfile, 'a+',
                                            checkambig=False)
                    dfh = None
                    if not destrevlog._inline:
                        dfh = destrevlog.opener(destrevlog.datafile, 'a+')
                    try:
                        destrevlog._addrevision(node, rawtext, tr, linkrev, p1,
                                                p2, flags, cachedelta, ifh, dfh,
                                                deltacomputer=deltacomputer)
                    finally:
                        if dfh:
                            dfh.close()
                        ifh.close()

                if addrevisioncb:
                    addrevisioncb(self, rev, node)
        finally:
            destrevlog._lazydeltabase = oldlazydeltabase
            destrevlog._deltabothparents = oldamd
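
Finally, a hedged usage sketch of clone() (``src``, ``dst`` and ``tr`` are assumed names for an existing source revlog, an empty destination revlog and an open transaction, in the spirit of the upgrade code that drives this API):

copied = [0]

def onrevision(rl, rev, node):
    copied[0] += 1              # clone() reports each revision it copies

src.clone(tr, dst, addrevisioncb=onrevision,
          deltareuse=src.DELTAREUSESAMEREVS)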