revlog: split functionality related to deltas computation in a new module...
Boris Feld
r39366:655b5b46 default
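The visible effect of this changeset on mercurial/debugcommands.py is small: it imports the new revlogutils.deltas module under the alias deltautil and switches the sparse-read sizing loop in debugdeltachain from the private revlog._slicechunk() helper to deltautil.slicechunk(). A minimal before/after sketch of that call site, using only names that appear in the hunk below:

    # before: chunk slicing lived on the revlog module itself
    for revschunk in revlog._slicechunk(r, chain):
        ...

    # after: delta-related helpers live in the new revlogutils.deltas module
    from .revlogutils import deltas as deltautil

    for revschunk in deltautil.slicechunk(r, chain):
        ...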
@@ -1,3361 +1,3365 b''
1 1 # debugcommands.py - command processing for debug* commands
2 2 #
3 3 # Copyright 2005-2016 Matt Mackall <mpm@selenic.com>
4 4 #
5 5 # This software may be used and distributed according to the terms of the
6 6 # GNU General Public License version 2 or any later version.
7 7
8 8 from __future__ import absolute_import
9 9
10 10 import codecs
11 11 import collections
12 12 import difflib
13 13 import errno
14 14 import operator
15 15 import os
16 16 import random
17 17 import re
18 18 import socket
19 19 import ssl
20 20 import stat
21 21 import string
22 22 import subprocess
23 23 import sys
24 24 import time
25 25
26 26 from .i18n import _
27 27 from .node import (
28 28 bin,
29 29 hex,
30 30 nullhex,
31 31 nullid,
32 32 nullrev,
33 33 short,
34 34 )
35 35 from .thirdparty import (
36 36 cbor,
37 37 )
38 38 from . import (
39 39 bundle2,
40 40 changegroup,
41 41 cmdutil,
42 42 color,
43 43 context,
44 44 dagparser,
45 45 encoding,
46 46 error,
47 47 exchange,
48 48 extensions,
49 49 filemerge,
50 50 filesetlang,
51 51 formatter,
52 52 hg,
53 53 httppeer,
54 54 localrepo,
55 55 lock as lockmod,
56 56 logcmdutil,
57 57 merge as mergemod,
58 58 obsolete,
59 59 obsutil,
60 60 phases,
61 61 policy,
62 62 pvec,
63 63 pycompat,
64 64 registrar,
65 65 repair,
66 66 revlog,
67 67 revset,
68 68 revsetlang,
69 69 scmutil,
70 70 setdiscovery,
71 71 simplemerge,
72 72 sshpeer,
73 73 sslutil,
74 74 streamclone,
75 75 templater,
76 76 treediscovery,
77 77 upgrade,
78 78 url as urlmod,
79 79 util,
80 80 vfs as vfsmod,
81 81 wireprotoframing,
82 82 wireprotoserver,
83 83 wireprotov2peer,
84 84 )
85 85 from .utils import (
86 86 dateutil,
87 87 procutil,
88 88 stringutil,
89 89 )
90 90
91 from .revlogutils import (
92 deltas as deltautil
93 )
94
91 95 release = lockmod.release
92 96
93 97 command = registrar.command()
94 98
95 99 @command('debugancestor', [], _('[INDEX] REV1 REV2'), optionalrepo=True)
96 100 def debugancestor(ui, repo, *args):
97 101 """find the ancestor revision of two revisions in a given index"""
98 102 if len(args) == 3:
99 103 index, rev1, rev2 = args
100 104 r = revlog.revlog(vfsmod.vfs(pycompat.getcwd(), audit=False), index)
101 105 lookup = r.lookup
102 106 elif len(args) == 2:
103 107 if not repo:
104 108 raise error.Abort(_('there is no Mercurial repository here '
105 109 '(.hg not found)'))
106 110 rev1, rev2 = args
107 111 r = repo.changelog
108 112 lookup = repo.lookup
109 113 else:
110 114 raise error.Abort(_('either two or three arguments required'))
111 115 a = r.ancestor(lookup(rev1), lookup(rev2))
112 116 ui.write('%d:%s\n' % (r.rev(a), hex(a)))
113 117
114 118 @command('debugapplystreamclonebundle', [], 'FILE')
115 119 def debugapplystreamclonebundle(ui, repo, fname):
116 120 """apply a stream clone bundle file"""
117 121 f = hg.openpath(ui, fname)
118 122 gen = exchange.readbundle(ui, f, fname)
119 123 gen.apply(repo)
120 124
121 125 @command('debugbuilddag',
122 126 [('m', 'mergeable-file', None, _('add single file mergeable changes')),
123 127 ('o', 'overwritten-file', None, _('add single file all revs overwrite')),
124 128 ('n', 'new-file', None, _('add new file at each rev'))],
125 129 _('[OPTION]... [TEXT]'))
126 130 def debugbuilddag(ui, repo, text=None,
127 131 mergeable_file=False,
128 132 overwritten_file=False,
129 133 new_file=False):
130 134 """builds a repo with a given DAG from scratch in the current empty repo
131 135
132 136 The description of the DAG is read from stdin if not given on the
133 137 command line.
134 138
135 139 Elements:
136 140
137 141 - "+n" is a linear run of n nodes based on the current default parent
138 142 - "." is a single node based on the current default parent
139 143 - "$" resets the default parent to null (implied at the start);
140 144 otherwise the default parent is always the last node created
141 145 - "<p" sets the default parent to the backref p
142 146 - "*p" is a fork at parent p, which is a backref
143 147 - "*p1/p2" is a merge of parents p1 and p2, which are backrefs
144 148 - "/p2" is a merge of the preceding node and p2
145 149 - ":tag" defines a local tag for the preceding node
146 150 - "@branch" sets the named branch for subsequent nodes
147 151 - "#...\\n" is a comment up to the end of the line
148 152
149 153 Whitespace between the above elements is ignored.
150 154
151 155 A backref is either
152 156
153 157 - a number n, which references the node curr-n, where curr is the current
154 158 node, or
155 159 - the name of a local tag you placed earlier using ":tag", or
156 160 - empty to denote the default parent.
157 161
158 162 All string valued-elements are either strictly alphanumeric, or must
159 163 be enclosed in double quotes ("..."), with "\\" as escape character.
160 164 """
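    # Example (illustrative, using only the grammar described above): the text
    #     +3 :mytag *mytag +2
    # builds three linear nodes, tags the last one "mytag", forks one new node
    # off that tagged revision, and then adds two more linear nodes on top of
    # the fork.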
161 165
162 166 if text is None:
163 167 ui.status(_("reading DAG from stdin\n"))
164 168 text = ui.fin.read()
165 169
166 170 cl = repo.changelog
167 171 if len(cl) > 0:
168 172 raise error.Abort(_('repository is not empty'))
169 173
170 174 # determine number of revs in DAG
171 175 total = 0
172 176 for type, data in dagparser.parsedag(text):
173 177 if type == 'n':
174 178 total += 1
175 179
176 180 if mergeable_file:
177 181 linesperrev = 2
178 182 # make a file with k lines per rev
179 183 initialmergedlines = ['%d' % i
180 184 for i in pycompat.xrange(0, total * linesperrev)]
181 185 initialmergedlines.append("")
182 186
183 187 tags = []
184 188 progress = ui.makeprogress(_('building'), unit=_('revisions'),
185 189 total=total)
186 190 with progress, repo.wlock(), repo.lock(), repo.transaction("builddag"):
187 191 at = -1
188 192 atbranch = 'default'
189 193 nodeids = []
190 194 id = 0
191 195 progress.update(id)
192 196 for type, data in dagparser.parsedag(text):
193 197 if type == 'n':
194 198 ui.note(('node %s\n' % pycompat.bytestr(data)))
195 199 id, ps = data
196 200
197 201 files = []
198 202 filecontent = {}
199 203
200 204 p2 = None
201 205 if mergeable_file:
202 206 fn = "mf"
203 207 p1 = repo[ps[0]]
204 208 if len(ps) > 1:
205 209 p2 = repo[ps[1]]
206 210 pa = p1.ancestor(p2)
207 211 base, local, other = [x[fn].data() for x in (pa, p1,
208 212 p2)]
209 213 m3 = simplemerge.Merge3Text(base, local, other)
210 214 ml = [l.strip() for l in m3.merge_lines()]
211 215 ml.append("")
212 216 elif at > 0:
213 217 ml = p1[fn].data().split("\n")
214 218 else:
215 219 ml = initialmergedlines
216 220 ml[id * linesperrev] += " r%i" % id
217 221 mergedtext = "\n".join(ml)
218 222 files.append(fn)
219 223 filecontent[fn] = mergedtext
220 224
221 225 if overwritten_file:
222 226 fn = "of"
223 227 files.append(fn)
224 228 filecontent[fn] = "r%i\n" % id
225 229
226 230 if new_file:
227 231 fn = "nf%i" % id
228 232 files.append(fn)
229 233 filecontent[fn] = "r%i\n" % id
230 234 if len(ps) > 1:
231 235 if not p2:
232 236 p2 = repo[ps[1]]
233 237 for fn in p2:
234 238 if fn.startswith("nf"):
235 239 files.append(fn)
236 240 filecontent[fn] = p2[fn].data()
237 241
238 242 def fctxfn(repo, cx, path):
239 243 if path in filecontent:
240 244 return context.memfilectx(repo, cx, path,
241 245 filecontent[path])
242 246 return None
243 247
244 248 if len(ps) == 0 or ps[0] < 0:
245 249 pars = [None, None]
246 250 elif len(ps) == 1:
247 251 pars = [nodeids[ps[0]], None]
248 252 else:
249 253 pars = [nodeids[p] for p in ps]
250 254 cx = context.memctx(repo, pars, "r%i" % id, files, fctxfn,
251 255 date=(id, 0),
252 256 user="debugbuilddag",
253 257 extra={'branch': atbranch})
254 258 nodeid = repo.commitctx(cx)
255 259 nodeids.append(nodeid)
256 260 at = id
257 261 elif type == 'l':
258 262 id, name = data
259 263 ui.note(('tag %s\n' % name))
260 264 tags.append("%s %s\n" % (hex(repo.changelog.node(id)), name))
261 265 elif type == 'a':
262 266 ui.note(('branch %s\n' % data))
263 267 atbranch = data
264 268 progress.update(id)
265 269
266 270 if tags:
267 271 repo.vfs.write("localtags", "".join(tags))
268 272
269 273 def _debugchangegroup(ui, gen, all=None, indent=0, **opts):
270 274 indent_string = ' ' * indent
271 275 if all:
272 276 ui.write(("%sformat: id, p1, p2, cset, delta base, len(delta)\n")
273 277 % indent_string)
274 278
275 279 def showchunks(named):
276 280 ui.write("\n%s%s\n" % (indent_string, named))
277 281 for deltadata in gen.deltaiter():
278 282 node, p1, p2, cs, deltabase, delta, flags = deltadata
279 283 ui.write("%s%s %s %s %s %s %d\n" %
280 284 (indent_string, hex(node), hex(p1), hex(p2),
281 285 hex(cs), hex(deltabase), len(delta)))
282 286
283 287 chunkdata = gen.changelogheader()
284 288 showchunks("changelog")
285 289 chunkdata = gen.manifestheader()
286 290 showchunks("manifest")
287 291 for chunkdata in iter(gen.filelogheader, {}):
288 292 fname = chunkdata['filename']
289 293 showchunks(fname)
290 294 else:
291 295 if isinstance(gen, bundle2.unbundle20):
292 296 raise error.Abort(_('use debugbundle2 for this file'))
293 297 chunkdata = gen.changelogheader()
294 298 for deltadata in gen.deltaiter():
295 299 node, p1, p2, cs, deltabase, delta, flags = deltadata
296 300 ui.write("%s%s\n" % (indent_string, hex(node)))
297 301
298 302 def _debugobsmarkers(ui, part, indent=0, **opts):
299 303 """display version and markers contained in 'data'"""
300 304 opts = pycompat.byteskwargs(opts)
301 305 data = part.read()
302 306 indent_string = ' ' * indent
303 307 try:
304 308 version, markers = obsolete._readmarkers(data)
305 309 except error.UnknownVersion as exc:
306 310 msg = "%sunsupported version: %s (%d bytes)\n"
307 311 msg %= indent_string, exc.version, len(data)
308 312 ui.write(msg)
309 313 else:
310 314 msg = "%sversion: %d (%d bytes)\n"
311 315 msg %= indent_string, version, len(data)
312 316 ui.write(msg)
313 317 fm = ui.formatter('debugobsolete', opts)
314 318 for rawmarker in sorted(markers):
315 319 m = obsutil.marker(None, rawmarker)
316 320 fm.startitem()
317 321 fm.plain(indent_string)
318 322 cmdutil.showmarker(fm, m)
319 323 fm.end()
320 324
321 325 def _debugphaseheads(ui, data, indent=0):
322 326 """display version and markers contained in 'data'"""
323 327 indent_string = ' ' * indent
324 328 headsbyphase = phases.binarydecode(data)
325 329 for phase in phases.allphases:
326 330 for head in headsbyphase[phase]:
327 331 ui.write(indent_string)
328 332 ui.write('%s %s\n' % (hex(head), phases.phasenames[phase]))
329 333
330 334 def _quasirepr(thing):
331 335 if isinstance(thing, (dict, util.sortdict, collections.OrderedDict)):
332 336 return '{%s}' % (
333 337 b', '.join(b'%s: %s' % (k, thing[k]) for k in sorted(thing)))
334 338 return pycompat.bytestr(repr(thing))
335 339
336 340 def _debugbundle2(ui, gen, all=None, **opts):
337 341 """lists the contents of a bundle2"""
338 342 if not isinstance(gen, bundle2.unbundle20):
339 343 raise error.Abort(_('not a bundle2 file'))
340 344 ui.write(('Stream params: %s\n' % _quasirepr(gen.params)))
341 345 parttypes = opts.get(r'part_type', [])
342 346 for part in gen.iterparts():
343 347 if parttypes and part.type not in parttypes:
344 348 continue
345 349 msg = '%s -- %s (mandatory: %r)\n'
346 350 ui.write((msg % (part.type, _quasirepr(part.params), part.mandatory)))
347 351 if part.type == 'changegroup':
348 352 version = part.params.get('version', '01')
349 353 cg = changegroup.getunbundler(version, part, 'UN')
350 354 if not ui.quiet:
351 355 _debugchangegroup(ui, cg, all=all, indent=4, **opts)
352 356 if part.type == 'obsmarkers':
353 357 if not ui.quiet:
354 358 _debugobsmarkers(ui, part, indent=4, **opts)
355 359 if part.type == 'phase-heads':
356 360 if not ui.quiet:
357 361 _debugphaseheads(ui, part, indent=4)
358 362
359 363 @command('debugbundle',
360 364 [('a', 'all', None, _('show all details')),
361 365 ('', 'part-type', [], _('show only the named part type')),
362 366 ('', 'spec', None, _('print the bundlespec of the bundle'))],
363 367 _('FILE'),
364 368 norepo=True)
365 369 def debugbundle(ui, bundlepath, all=None, spec=None, **opts):
366 370 """lists the contents of a bundle"""
367 371 with hg.openpath(ui, bundlepath) as f:
368 372 if spec:
369 373 spec = exchange.getbundlespec(ui, f)
370 374 ui.write('%s\n' % spec)
371 375 return
372 376
373 377 gen = exchange.readbundle(ui, f, bundlepath)
374 378 if isinstance(gen, bundle2.unbundle20):
375 379 return _debugbundle2(ui, gen, all=all, **opts)
376 380 _debugchangegroup(ui, gen, all=all, **opts)
377 381
378 382 @command('debugcapabilities',
379 383 [], _('PATH'),
380 384 norepo=True)
381 385 def debugcapabilities(ui, path, **opts):
382 386 """lists the capabilities of a remote peer"""
383 387 opts = pycompat.byteskwargs(opts)
384 388 peer = hg.peer(ui, opts, path)
385 389 caps = peer.capabilities()
386 390 ui.write(('Main capabilities:\n'))
387 391 for c in sorted(caps):
388 392 ui.write((' %s\n') % c)
389 393 b2caps = bundle2.bundle2caps(peer)
390 394 if b2caps:
391 395 ui.write(('Bundle2 capabilities:\n'))
392 396 for key, values in sorted(b2caps.iteritems()):
393 397 ui.write((' %s\n') % key)
394 398 for v in values:
395 399 ui.write((' %s\n') % v)
396 400
397 401 @command('debugcheckstate', [], '')
398 402 def debugcheckstate(ui, repo):
399 403 """validate the correctness of the current dirstate"""
400 404 parent1, parent2 = repo.dirstate.parents()
401 405 m1 = repo[parent1].manifest()
402 406 m2 = repo[parent2].manifest()
403 407 errors = 0
404 408 for f in repo.dirstate:
405 409 state = repo.dirstate[f]
406 410 if state in "nr" and f not in m1:
407 411 ui.warn(_("%s in state %s, but not in manifest1\n") % (f, state))
408 412 errors += 1
409 413 if state in "a" and f in m1:
410 414 ui.warn(_("%s in state %s, but also in manifest1\n") % (f, state))
411 415 errors += 1
412 416 if state in "m" and f not in m1 and f not in m2:
413 417 ui.warn(_("%s in state %s, but not in either manifest\n") %
414 418 (f, state))
415 419 errors += 1
416 420 for f in m1:
417 421 state = repo.dirstate[f]
418 422 if state not in "nrm":
419 423 ui.warn(_("%s in manifest1, but listed as state %s") % (f, state))
420 424 errors += 1
421 425 if errors:
422 426 error = _(".hg/dirstate inconsistent with current parent's manifest")
423 427 raise error.Abort(error)
424 428
425 429 @command('debugcolor',
426 430 [('', 'style', None, _('show all configured styles'))],
427 431 'hg debugcolor')
428 432 def debugcolor(ui, repo, **opts):
429 433 """show available color, effects or style"""
430 434 ui.write(('color mode: %s\n') % stringutil.pprint(ui._colormode))
431 435 if opts.get(r'style'):
432 436 return _debugdisplaystyle(ui)
433 437 else:
434 438 return _debugdisplaycolor(ui)
435 439
436 440 def _debugdisplaycolor(ui):
437 441 ui = ui.copy()
438 442 ui._styles.clear()
439 443 for effect in color._activeeffects(ui).keys():
440 444 ui._styles[effect] = effect
441 445 if ui._terminfoparams:
442 446 for k, v in ui.configitems('color'):
443 447 if k.startswith('color.'):
444 448 ui._styles[k] = k[6:]
445 449 elif k.startswith('terminfo.'):
446 450 ui._styles[k] = k[9:]
447 451 ui.write(_('available colors:\n'))
448 452 # sort labels with a '_' after the others to group the '_background' entries.
449 453 items = sorted(ui._styles.items(),
450 454 key=lambda i: ('_' in i[0], i[0], i[1]))
451 455 for colorname, label in items:
452 456 ui.write(('%s\n') % colorname, label=label)
453 457
454 458 def _debugdisplaystyle(ui):
455 459 ui.write(_('available style:\n'))
456 460 if not ui._styles:
457 461 return
458 462 width = max(len(s) for s in ui._styles)
459 463 for label, effects in sorted(ui._styles.items()):
460 464 ui.write('%s' % label, label=label)
461 465 if effects:
462 466 # 50
463 467 ui.write(': ')
464 468 ui.write(' ' * (max(0, width - len(label))))
465 469 ui.write(', '.join(ui.label(e, e) for e in effects.split()))
466 470 ui.write('\n')
467 471
468 472 @command('debugcreatestreamclonebundle', [], 'FILE')
469 473 def debugcreatestreamclonebundle(ui, repo, fname):
470 474 """create a stream clone bundle file
471 475
472 476 Stream bundles are special bundles that are essentially archives of
473 477 revlog files. They are commonly used for cloning very quickly.
474 478 """
475 479 # TODO we may want to turn this into an abort when this functionality
476 480 # is moved into `hg bundle`.
477 481 if phases.hassecret(repo):
478 482 ui.warn(_('(warning: stream clone bundle will contain secret '
479 483 'revisions)\n'))
480 484
481 485 requirements, gen = streamclone.generatebundlev1(repo)
482 486 changegroup.writechunks(ui, gen, fname)
483 487
484 488 ui.write(_('bundle requirements: %s\n') % ', '.join(sorted(requirements)))
485 489
486 490 @command('debugdag',
487 491 [('t', 'tags', None, _('use tags as labels')),
488 492 ('b', 'branches', None, _('annotate with branch names')),
489 493 ('', 'dots', None, _('use dots for runs')),
490 494 ('s', 'spaces', None, _('separate elements by spaces'))],
491 495 _('[OPTION]... [FILE [REV]...]'),
492 496 optionalrepo=True)
493 497 def debugdag(ui, repo, file_=None, *revs, **opts):
494 498 """format the changelog or an index DAG as a concise textual description
495 499
496 500 If you pass a revlog index, the revlog's DAG is emitted. If you list
497 501 revision numbers, they get labeled in the output as rN.
498 502
499 503 Otherwise, the changelog DAG of the current repo is emitted.
500 504 """
501 505 spaces = opts.get(r'spaces')
502 506 dots = opts.get(r'dots')
503 507 if file_:
504 508 rlog = revlog.revlog(vfsmod.vfs(pycompat.getcwd(), audit=False),
505 509 file_)
506 510 revs = set((int(r) for r in revs))
507 511 def events():
508 512 for r in rlog:
509 513 yield 'n', (r, list(p for p in rlog.parentrevs(r)
510 514 if p != -1))
511 515 if r in revs:
512 516 yield 'l', (r, "r%i" % r)
513 517 elif repo:
514 518 cl = repo.changelog
515 519 tags = opts.get(r'tags')
516 520 branches = opts.get(r'branches')
517 521 if tags:
518 522 labels = {}
519 523 for l, n in repo.tags().items():
520 524 labels.setdefault(cl.rev(n), []).append(l)
521 525 def events():
522 526 b = "default"
523 527 for r in cl:
524 528 if branches:
525 529 newb = cl.read(cl.node(r))[5]['branch']
526 530 if newb != b:
527 531 yield 'a', newb
528 532 b = newb
529 533 yield 'n', (r, list(p for p in cl.parentrevs(r)
530 534 if p != -1))
531 535 if tags:
532 536 ls = labels.get(r)
533 537 if ls:
534 538 for l in ls:
535 539 yield 'l', (r, l)
536 540 else:
537 541 raise error.Abort(_('need repo for changelog dag'))
538 542
539 543 for line in dagparser.dagtextlines(events(),
540 544 addspaces=spaces,
541 545 wraplabels=True,
542 546 wrapannotations=True,
543 547 wrapnonlinear=dots,
544 548 usedots=dots,
545 549 maxlinewidth=70):
546 550 ui.write(line)
547 551 ui.write("\n")
548 552
549 553 @command('debugdata', cmdutil.debugrevlogopts, _('-c|-m|FILE REV'))
550 554 def debugdata(ui, repo, file_, rev=None, **opts):
551 555 """dump the contents of a data file revision"""
552 556 opts = pycompat.byteskwargs(opts)
553 557 if opts.get('changelog') or opts.get('manifest') or opts.get('dir'):
554 558 if rev is not None:
555 559 raise error.CommandError('debugdata', _('invalid arguments'))
556 560 file_, rev = None, file_
557 561 elif rev is None:
558 562 raise error.CommandError('debugdata', _('invalid arguments'))
559 563 r = cmdutil.openstorage(repo, 'debugdata', file_, opts)
560 564 try:
561 565 ui.write(r.revision(r.lookup(rev), raw=True))
562 566 except KeyError:
563 567 raise error.Abort(_('invalid revision identifier %s') % rev)
564 568
565 569 @command('debugdate',
566 570 [('e', 'extended', None, _('try extended date formats'))],
567 571 _('[-e] DATE [RANGE]'),
568 572 norepo=True, optionalrepo=True)
569 573 def debugdate(ui, date, range=None, **opts):
570 574 """parse and display a date"""
571 575 if opts[r"extended"]:
572 576 d = dateutil.parsedate(date, util.extendeddateformats)
573 577 else:
574 578 d = dateutil.parsedate(date)
575 579 ui.write(("internal: %d %d\n") % d)
576 580 ui.write(("standard: %s\n") % dateutil.datestr(d))
577 581 if range:
578 582 m = dateutil.matchdate(range)
579 583 ui.write(("match: %s\n") % m(d[0]))
580 584
581 585 @command('debugdeltachain',
582 586 cmdutil.debugrevlogopts + cmdutil.formatteropts,
583 587 _('-c|-m|FILE'),
584 588 optionalrepo=True)
585 589 def debugdeltachain(ui, repo, file_=None, **opts):
586 590 """dump information about delta chains in a revlog
587 591
588 592 Output can be templatized. Available template keywords are:
589 593
590 594 :``rev``: revision number
591 595 :``chainid``: delta chain identifier (numbered by unique base)
592 596 :``chainlen``: delta chain length to this revision
593 597 :``prevrev``: previous revision in delta chain
594 598 :``deltatype``: role of delta / how it was computed
595 599 :``compsize``: compressed size of revision
596 600 :``uncompsize``: uncompressed size of revision
597 601 :``chainsize``: total size of compressed revisions in chain
598 602 :``chainratio``: total chain size divided by uncompressed revision size
599 603 (new delta chains typically start at ratio 2.00)
600 604 :``lindist``: linear distance from base revision in delta chain to end
601 605 of this revision
602 606 :``extradist``: total size of revisions not part of this delta chain from
603 607 base of delta chain to end of this revision; a measurement
604 608 of how much extra data we need to read/seek across to read
605 609 the delta chain for this revision
606 610 :``extraratio``: extradist divided by chainsize; another representation of
607 611 how much unrelated data is needed to load this delta chain
608 612
609 613 If the repository is configured to use the sparse read, additional keywords
610 614 are available:
611 615
612 616 :``readsize``: total size of data read from the disk for a revision
613 617 (sum of the sizes of all the blocks)
614 618 :``largestblock``: size of the largest block of data read from the disk
615 619 :``readdensity``: density of useful bytes in the data read from the disk
616 620 :``srchunks``: in how many data hunks the whole revision would be read
617 621
618 622 The sparse read can be enabled with experimental.sparse-read = True
619 623 """
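    # Worked example with made-up numbers, following the formulas applied
    # further down: for a revision whose delta chain compresses to
    # chainsize = 900 bytes against an uncompressed size of 600 bytes,
    # chainratio = 900 / 600 = 1.50; if reading that chain spans
    # lindist = 1200 bytes on disk, then extradist = 1200 - 900 = 300 and
    # extraratio = 300 / 900 ~= 0.33.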
620 624 opts = pycompat.byteskwargs(opts)
621 625 r = cmdutil.openrevlog(repo, 'debugdeltachain', file_, opts)
622 626 index = r.index
623 627 start = r.start
624 628 length = r.length
625 629 generaldelta = r.version & revlog.FLAG_GENERALDELTA
626 630 withsparseread = getattr(r, '_withsparseread', False)
627 631
628 632 def revinfo(rev):
629 633 e = index[rev]
630 634 compsize = e[1]
631 635 uncompsize = e[2]
632 636 chainsize = 0
633 637
634 638 if generaldelta:
635 639 if e[3] == e[5]:
636 640 deltatype = 'p1'
637 641 elif e[3] == e[6]:
638 642 deltatype = 'p2'
639 643 elif e[3] == rev - 1:
640 644 deltatype = 'prev'
641 645 elif e[3] == rev:
642 646 deltatype = 'base'
643 647 else:
644 648 deltatype = 'other'
645 649 else:
646 650 if e[3] == rev:
647 651 deltatype = 'base'
648 652 else:
649 653 deltatype = 'prev'
650 654
651 655 chain = r._deltachain(rev)[0]
652 656 for iterrev in chain:
653 657 e = index[iterrev]
654 658 chainsize += e[1]
655 659
656 660 return compsize, uncompsize, deltatype, chain, chainsize
657 661
658 662 fm = ui.formatter('debugdeltachain', opts)
659 663
660 664 fm.plain(' rev chain# chainlen prev delta '
661 665 'size rawsize chainsize ratio lindist extradist '
662 666 'extraratio')
663 667 if withsparseread:
664 668 fm.plain(' readsize largestblk rddensity srchunks')
665 669 fm.plain('\n')
666 670
667 671 chainbases = {}
668 672 for rev in r:
669 673 comp, uncomp, deltatype, chain, chainsize = revinfo(rev)
670 674 chainbase = chain[0]
671 675 chainid = chainbases.setdefault(chainbase, len(chainbases) + 1)
672 676 basestart = start(chainbase)
673 677 revstart = start(rev)
674 678 lineardist = revstart + comp - basestart
675 679 extradist = lineardist - chainsize
676 680 try:
677 681 prevrev = chain[-2]
678 682 except IndexError:
679 683 prevrev = -1
680 684
681 685 if uncomp != 0:
682 686 chainratio = float(chainsize) / float(uncomp)
683 687 else:
684 688 chainratio = chainsize
685 689
686 690 if chainsize != 0:
687 691 extraratio = float(extradist) / float(chainsize)
688 692 else:
689 693 extraratio = extradist
690 694
691 695 fm.startitem()
692 696 fm.write('rev chainid chainlen prevrev deltatype compsize '
693 697 'uncompsize chainsize chainratio lindist extradist '
694 698 'extraratio',
695 699 '%7d %7d %8d %8d %7s %10d %10d %10d %9.5f %9d %9d %10.5f',
696 700 rev, chainid, len(chain), prevrev, deltatype, comp,
697 701 uncomp, chainsize, chainratio, lineardist, extradist,
698 702 extraratio,
699 703 rev=rev, chainid=chainid, chainlen=len(chain),
700 704 prevrev=prevrev, deltatype=deltatype, compsize=comp,
701 705 uncompsize=uncomp, chainsize=chainsize,
702 706 chainratio=chainratio, lindist=lineardist,
703 707 extradist=extradist, extraratio=extraratio)
704 708 if withsparseread:
705 709 readsize = 0
706 710 largestblock = 0
707 711 srchunks = 0
708 712
709 for revschunk in revlog._slicechunk(r, chain):
713 for revschunk in deltautil.slicechunk(r, chain):
710 714 srchunks += 1
711 715 blkend = start(revschunk[-1]) + length(revschunk[-1])
712 716 blksize = blkend - start(revschunk[0])
713 717
714 718 readsize += blksize
715 719 if largestblock < blksize:
716 720 largestblock = blksize
717 721
718 722 if readsize:
719 723 readdensity = float(chainsize) / float(readsize)
720 724 else:
721 725 readdensity = 1
722 726
723 727 fm.write('readsize largestblock readdensity srchunks',
724 728 ' %10d %10d %9.5f %8d',
725 729 readsize, largestblock, readdensity, srchunks,
726 730 readsize=readsize, largestblock=largestblock,
727 731 readdensity=readdensity, srchunks=srchunks)
728 732
729 733 fm.plain('\n')
730 734
731 735 fm.end()
732 736
733 737 @command('debugdirstate|debugstate',
734 738 [('', 'nodates', None, _('do not display the saved mtime')),
735 739 ('', 'datesort', None, _('sort by saved mtime'))],
736 740 _('[OPTION]...'))
737 741 def debugstate(ui, repo, **opts):
738 742 """show the contents of the current dirstate"""
739 743
740 744 nodates = opts.get(r'nodates')
741 745 datesort = opts.get(r'datesort')
742 746
743 747 timestr = ""
744 748 if datesort:
745 749 keyfunc = lambda x: (x[1][3], x[0]) # sort by mtime, then by filename
746 750 else:
747 751 keyfunc = None # sort by filename
748 752 for file_, ent in sorted(repo.dirstate._map.iteritems(), key=keyfunc):
749 753 if ent[3] == -1:
750 754 timestr = 'unset '
751 755 elif nodates:
752 756 timestr = 'set '
753 757 else:
754 758 timestr = time.strftime(r"%Y-%m-%d %H:%M:%S ",
755 759 time.localtime(ent[3]))
756 760 timestr = encoding.strtolocal(timestr)
757 761 if ent[1] & 0o20000:
758 762 mode = 'lnk'
759 763 else:
760 764 mode = '%3o' % (ent[1] & 0o777 & ~util.umask)
761 765 ui.write("%c %s %10d %s%s\n" % (ent[0], mode, ent[2], timestr, file_))
762 766 for f in repo.dirstate.copies():
763 767 ui.write(_("copy: %s -> %s\n") % (repo.dirstate.copied(f), f))
764 768
765 769 @command('debugdiscovery',
766 770 [('', 'old', None, _('use old-style discovery')),
767 771 ('', 'nonheads', None,
768 772 _('use old-style discovery with non-heads included')),
769 773 ('', 'rev', [], 'restrict discovery to this set of revs'),
770 774 ] + cmdutil.remoteopts,
771 775 _('[--rev REV] [OTHER]'))
772 776 def debugdiscovery(ui, repo, remoteurl="default", **opts):
773 777 """runs the changeset discovery protocol in isolation"""
774 778 opts = pycompat.byteskwargs(opts)
775 779 remoteurl, branches = hg.parseurl(ui.expandpath(remoteurl))
776 780 remote = hg.peer(repo, opts, remoteurl)
777 781 ui.status(_('comparing with %s\n') % util.hidepassword(remoteurl))
778 782
779 783 # make sure tests are repeatable
780 784 random.seed(12323)
781 785
782 786 def doit(pushedrevs, remoteheads, remote=remote):
783 787 if opts.get('old'):
784 788 if not util.safehasattr(remote, 'branches'):
785 789 # enable in-client legacy support
786 790 remote = localrepo.locallegacypeer(remote.local())
787 791 common, _in, hds = treediscovery.findcommonincoming(repo, remote,
788 792 force=True)
789 793 common = set(common)
790 794 if not opts.get('nonheads'):
791 795 ui.write(("unpruned common: %s\n") %
792 796 " ".join(sorted(short(n) for n in common)))
793 797
794 798 clnode = repo.changelog.node
795 799 common = repo.revs('heads(::%ln)', common)
796 800 common = {clnode(r) for r in common}
797 801 else:
798 802 nodes = None
799 803 if pushedrevs:
800 804 revs = scmutil.revrange(repo, pushedrevs)
801 805 nodes = [repo[r].node() for r in revs]
802 806 common, any, hds = setdiscovery.findcommonheads(ui, repo, remote,
803 807 ancestorsof=nodes)
804 808 common = set(common)
805 809 rheads = set(hds)
806 810 lheads = set(repo.heads())
807 811 ui.write(("common heads: %s\n") %
808 812 " ".join(sorted(short(n) for n in common)))
809 813 if lheads <= common:
810 814 ui.write(("local is subset\n"))
811 815 elif rheads <= common:
812 816 ui.write(("remote is subset\n"))
813 817
814 818 remoterevs, _checkout = hg.addbranchrevs(repo, remote, branches, revs=None)
815 819 localrevs = opts['rev']
816 820 doit(localrevs, remoterevs)
817 821
818 822 _chunksize = 4 << 10
819 823
820 824 @command('debugdownload',
821 825 [
822 826 ('o', 'output', '', _('path')),
823 827 ],
824 828 optionalrepo=True)
825 829 def debugdownload(ui, repo, url, output=None, **opts):
826 830 """download a resource using Mercurial logic and config
827 831 """
828 832 fh = urlmod.open(ui, url, output)
829 833
830 834 dest = ui
831 835 if output:
832 836 dest = open(output, "wb", _chunksize)
833 837 try:
834 838 data = fh.read(_chunksize)
835 839 while data:
836 840 dest.write(data)
837 841 data = fh.read(_chunksize)
838 842 finally:
839 843 if output:
840 844 dest.close()
841 845
842 846 @command('debugextensions', cmdutil.formatteropts, [], optionalrepo=True)
843 847 def debugextensions(ui, repo, **opts):
844 848 '''show information about active extensions'''
845 849 opts = pycompat.byteskwargs(opts)
846 850 exts = extensions.extensions(ui)
847 851 hgver = util.version()
848 852 fm = ui.formatter('debugextensions', opts)
849 853 for extname, extmod in sorted(exts, key=operator.itemgetter(0)):
850 854 isinternal = extensions.ismoduleinternal(extmod)
851 855 extsource = pycompat.fsencode(extmod.__file__)
852 856 if isinternal:
853 857 exttestedwith = [] # never expose magic string to users
854 858 else:
855 859 exttestedwith = getattr(extmod, 'testedwith', '').split()
856 860 extbuglink = getattr(extmod, 'buglink', None)
857 861
858 862 fm.startitem()
859 863
860 864 if ui.quiet or ui.verbose:
861 865 fm.write('name', '%s\n', extname)
862 866 else:
863 867 fm.write('name', '%s', extname)
864 868 if isinternal or hgver in exttestedwith:
865 869 fm.plain('\n')
866 870 elif not exttestedwith:
867 871 fm.plain(_(' (untested!)\n'))
868 872 else:
869 873 lasttestedversion = exttestedwith[-1]
870 874 fm.plain(' (%s!)\n' % lasttestedversion)
871 875
872 876 fm.condwrite(ui.verbose and extsource, 'source',
873 877 _(' location: %s\n'), extsource or "")
874 878
875 879 if ui.verbose:
876 880 fm.plain(_(' bundled: %s\n') % ['no', 'yes'][isinternal])
877 881 fm.data(bundled=isinternal)
878 882
879 883 fm.condwrite(ui.verbose and exttestedwith, 'testedwith',
880 884 _(' tested with: %s\n'),
881 885 fm.formatlist(exttestedwith, name='ver'))
882 886
883 887 fm.condwrite(ui.verbose and extbuglink, 'buglink',
884 888 _(' bug reporting: %s\n'), extbuglink or "")
885 889
886 890 fm.end()
887 891
888 892 @command('debugfileset',
889 893 [('r', 'rev', '', _('apply the filespec on this revision'), _('REV')),
890 894 ('', 'all-files', False,
891 895 _('test files from all revisions and working directory')),
892 896 ('s', 'show-matcher', None,
893 897 _('print internal representation of matcher')),
894 898 ('p', 'show-stage', [],
895 899 _('print parsed tree at the given stage'), _('NAME'))],
896 900 _('[-r REV] [--all-files] [OPTION]... FILESPEC'))
897 901 def debugfileset(ui, repo, expr, **opts):
898 902 '''parse and apply a fileset specification'''
899 903 from . import fileset
900 904 fileset.symbols # force import of fileset so we have predicates to optimize
901 905 opts = pycompat.byteskwargs(opts)
902 906 ctx = scmutil.revsingle(repo, opts.get('rev'), None)
903 907
904 908 stages = [
905 909 ('parsed', pycompat.identity),
906 910 ('analyzed', filesetlang.analyze),
907 911 ('optimized', filesetlang.optimize),
908 912 ]
909 913 stagenames = set(n for n, f in stages)
910 914
911 915 showalways = set()
912 916 if ui.verbose and not opts['show_stage']:
913 917 # show parsed tree by --verbose (deprecated)
914 918 showalways.add('parsed')
915 919 if opts['show_stage'] == ['all']:
916 920 showalways.update(stagenames)
917 921 else:
918 922 for n in opts['show_stage']:
919 923 if n not in stagenames:
920 924 raise error.Abort(_('invalid stage name: %s') % n)
921 925 showalways.update(opts['show_stage'])
922 926
923 927 tree = filesetlang.parse(expr)
924 928 for n, f in stages:
925 929 tree = f(tree)
926 930 if n in showalways:
927 931 if opts['show_stage'] or n != 'parsed':
928 932 ui.write(("* %s:\n") % n)
929 933 ui.write(filesetlang.prettyformat(tree), "\n")
930 934
931 935 files = set()
932 936 if opts['all_files']:
933 937 for r in repo:
934 938 c = repo[r]
935 939 files.update(c.files())
936 940 files.update(c.substate)
937 941 if opts['all_files'] or ctx.rev() is None:
938 942 wctx = repo[None]
939 943 files.update(repo.dirstate.walk(scmutil.matchall(repo),
940 944 subrepos=list(wctx.substate),
941 945 unknown=True, ignored=True))
942 946 files.update(wctx.substate)
943 947 else:
944 948 files.update(ctx.files())
945 949 files.update(ctx.substate)
946 950
947 951 m = ctx.matchfileset(expr)
948 952 if opts['show_matcher'] or (opts['show_matcher'] is None and ui.verbose):
949 953 ui.write(('* matcher:\n'), stringutil.prettyrepr(m), '\n')
950 954 for f in sorted(files):
951 955 if not m(f):
952 956 continue
953 957 ui.write("%s\n" % f)
954 958
955 959 @command('debugformat',
956 960 [] + cmdutil.formatteropts)
957 961 def debugformat(ui, repo, **opts):
958 962 """display format information about the current repository
959 963
960 964 Use --verbose to get extra information about current config value and
961 965 Mercurial default."""
962 966 opts = pycompat.byteskwargs(opts)
963 967 maxvariantlength = max(len(fv.name) for fv in upgrade.allformatvariant)
964 968 maxvariantlength = max(len('format-variant'), maxvariantlength)
965 969
966 970 def makeformatname(name):
967 971 return '%s:' + (' ' * (maxvariantlength - len(name)))
968 972
969 973 fm = ui.formatter('debugformat', opts)
970 974 if fm.isplain():
971 975 def formatvalue(value):
972 976 if util.safehasattr(value, 'startswith'):
973 977 return value
974 978 if value:
975 979 return 'yes'
976 980 else:
977 981 return 'no'
978 982 else:
979 983 formatvalue = pycompat.identity
980 984
981 985 fm.plain('format-variant')
982 986 fm.plain(' ' * (maxvariantlength - len('format-variant')))
983 987 fm.plain(' repo')
984 988 if ui.verbose:
985 989 fm.plain(' config default')
986 990 fm.plain('\n')
987 991 for fv in upgrade.allformatvariant:
988 992 fm.startitem()
989 993 repovalue = fv.fromrepo(repo)
990 994 configvalue = fv.fromconfig(repo)
991 995
992 996 if repovalue != configvalue:
993 997 namelabel = 'formatvariant.name.mismatchconfig'
994 998 repolabel = 'formatvariant.repo.mismatchconfig'
995 999 elif repovalue != fv.default:
996 1000 namelabel = 'formatvariant.name.mismatchdefault'
997 1001 repolabel = 'formatvariant.repo.mismatchdefault'
998 1002 else:
999 1003 namelabel = 'formatvariant.name.uptodate'
1000 1004 repolabel = 'formatvariant.repo.uptodate'
1001 1005
1002 1006 fm.write('name', makeformatname(fv.name), fv.name,
1003 1007 label=namelabel)
1004 1008 fm.write('repo', ' %3s', formatvalue(repovalue),
1005 1009 label=repolabel)
1006 1010 if fv.default != configvalue:
1007 1011 configlabel = 'formatvariant.config.special'
1008 1012 else:
1009 1013 configlabel = 'formatvariant.config.default'
1010 1014 fm.condwrite(ui.verbose, 'config', ' %6s', formatvalue(configvalue),
1011 1015 label=configlabel)
1012 1016 fm.condwrite(ui.verbose, 'default', ' %7s', formatvalue(fv.default),
1013 1017 label='formatvariant.default')
1014 1018 fm.plain('\n')
1015 1019 fm.end()
1016 1020
1017 1021 @command('debugfsinfo', [], _('[PATH]'), norepo=True)
1018 1022 def debugfsinfo(ui, path="."):
1019 1023 """show information detected about current filesystem"""
1020 1024 ui.write(('path: %s\n') % path)
1021 1025 ui.write(('mounted on: %s\n') % (util.getfsmountpoint(path) or '(unknown)'))
1022 1026 ui.write(('exec: %s\n') % (util.checkexec(path) and 'yes' or 'no'))
1023 1027 ui.write(('fstype: %s\n') % (util.getfstype(path) or '(unknown)'))
1024 1028 ui.write(('symlink: %s\n') % (util.checklink(path) and 'yes' or 'no'))
1025 1029 ui.write(('hardlink: %s\n') % (util.checknlink(path) and 'yes' or 'no'))
1026 1030 casesensitive = '(unknown)'
1027 1031 try:
1028 1032 with pycompat.namedtempfile(prefix='.debugfsinfo', dir=path) as f:
1029 1033 casesensitive = util.fscasesensitive(f.name) and 'yes' or 'no'
1030 1034 except OSError:
1031 1035 pass
1032 1036 ui.write(('case-sensitive: %s\n') % casesensitive)
1033 1037
1034 1038 @command('debuggetbundle',
1035 1039 [('H', 'head', [], _('id of head node'), _('ID')),
1036 1040 ('C', 'common', [], _('id of common node'), _('ID')),
1037 1041 ('t', 'type', 'bzip2', _('bundle compression type to use'), _('TYPE'))],
1038 1042 _('REPO FILE [-H|-C ID]...'),
1039 1043 norepo=True)
1040 1044 def debuggetbundle(ui, repopath, bundlepath, head=None, common=None, **opts):
1041 1045 """retrieves a bundle from a repo
1042 1046
1043 1047 Every ID must be a full-length hex node id string. Saves the bundle to the
1044 1048 given file.
1045 1049 """
1046 1050 opts = pycompat.byteskwargs(opts)
1047 1051 repo = hg.peer(ui, opts, repopath)
1048 1052 if not repo.capable('getbundle'):
1049 1053 raise error.Abort("getbundle() not supported by target repository")
1050 1054 args = {}
1051 1055 if common:
1052 1056 args[r'common'] = [bin(s) for s in common]
1053 1057 if head:
1054 1058 args[r'heads'] = [bin(s) for s in head]
1055 1059 # TODO: get desired bundlecaps from command line.
1056 1060 args[r'bundlecaps'] = None
1057 1061 bundle = repo.getbundle('debug', **args)
1058 1062
1059 1063 bundletype = opts.get('type', 'bzip2').lower()
1060 1064 btypes = {'none': 'HG10UN',
1061 1065 'bzip2': 'HG10BZ',
1062 1066 'gzip': 'HG10GZ',
1063 1067 'bundle2': 'HG20'}
1064 1068 bundletype = btypes.get(bundletype)
1065 1069 if bundletype not in bundle2.bundletypes:
1066 1070 raise error.Abort(_('unknown bundle type specified with --type'))
1067 1071 bundle2.writebundle(ui, bundle, bundlepath, bundletype)
1068 1072
1069 1073 @command('debugignore', [], '[FILE]')
1070 1074 def debugignore(ui, repo, *files, **opts):
1071 1075 """display the combined ignore pattern and information about ignored files
1072 1076
1073 1077 With no argument display the combined ignore pattern.
1074 1078
1075 1079 Given space separated file names, shows if the given file is ignored and
1076 1080 if so, show the ignore rule (file and line number) that matched it.
1077 1081 """
1078 1082 ignore = repo.dirstate._ignore
1079 1083 if not files:
1080 1084 # Show all the patterns
1081 1085 ui.write("%s\n" % pycompat.byterepr(ignore))
1082 1086 else:
1083 1087 m = scmutil.match(repo[None], pats=files)
1084 1088 for f in m.files():
1085 1089 nf = util.normpath(f)
1086 1090 ignored = None
1087 1091 ignoredata = None
1088 1092 if nf != '.':
1089 1093 if ignore(nf):
1090 1094 ignored = nf
1091 1095 ignoredata = repo.dirstate._ignorefileandline(nf)
1092 1096 else:
1093 1097 for p in util.finddirs(nf):
1094 1098 if ignore(p):
1095 1099 ignored = p
1096 1100 ignoredata = repo.dirstate._ignorefileandline(p)
1097 1101 break
1098 1102 if ignored:
1099 1103 if ignored == nf:
1100 1104 ui.write(_("%s is ignored\n") % m.uipath(f))
1101 1105 else:
1102 1106 ui.write(_("%s is ignored because of "
1103 1107 "containing folder %s\n")
1104 1108 % (m.uipath(f), ignored))
1105 1109 ignorefile, lineno, line = ignoredata
1106 1110 ui.write(_("(ignore rule in %s, line %d: '%s')\n")
1107 1111 % (ignorefile, lineno, line))
1108 1112 else:
1109 1113 ui.write(_("%s is not ignored\n") % m.uipath(f))
1110 1114
1111 1115 @command('debugindex', cmdutil.debugrevlogopts + cmdutil.formatteropts,
1112 1116 _('-c|-m|FILE'))
1113 1117 def debugindex(ui, repo, file_=None, **opts):
1114 1118 """dump index data for a storage primitive"""
1115 1119 opts = pycompat.byteskwargs(opts)
1116 1120 store = cmdutil.openstorage(repo, 'debugindex', file_, opts)
1117 1121
1118 1122 if ui.debugflag:
1119 1123 shortfn = hex
1120 1124 else:
1121 1125 shortfn = short
1122 1126
1123 1127 idlen = 12
1124 1128 for i in store:
1125 1129 idlen = len(shortfn(store.node(i)))
1126 1130 break
1127 1131
1128 1132 fm = ui.formatter('debugindex', opts)
1129 1133 fm.plain(b' rev linkrev %s %s p2\n' % (
1130 1134 b'nodeid'.ljust(idlen),
1131 1135 b'p1'.ljust(idlen)))
1132 1136
1133 1137 for rev in store:
1134 1138 node = store.node(rev)
1135 1139 parents = store.parents(node)
1136 1140
1137 1141 fm.startitem()
1138 1142 fm.write(b'rev', b'%6d ', rev)
1139 1143 fm.write(b'linkrev', '%7d ', store.linkrev(rev))
1140 1144 fm.write(b'node', '%s ', shortfn(node))
1141 1145 fm.write(b'p1', '%s ', shortfn(parents[0]))
1142 1146 fm.write(b'p2', '%s', shortfn(parents[1]))
1143 1147 fm.plain(b'\n')
1144 1148
1145 1149 fm.end()
1146 1150
1147 1151 @command('debugindexdot', cmdutil.debugrevlogopts,
1148 1152 _('-c|-m|FILE'), optionalrepo=True)
1149 1153 def debugindexdot(ui, repo, file_=None, **opts):
1150 1154 """dump an index DAG as a graphviz dot file"""
1151 1155 opts = pycompat.byteskwargs(opts)
1152 1156 r = cmdutil.openstorage(repo, 'debugindexdot', file_, opts)
1153 1157 ui.write(("digraph G {\n"))
1154 1158 for i in r:
1155 1159 node = r.node(i)
1156 1160 pp = r.parents(node)
1157 1161 ui.write("\t%d -> %d\n" % (r.rev(pp[0]), i))
1158 1162 if pp[1] != nullid:
1159 1163 ui.write("\t%d -> %d\n" % (r.rev(pp[1]), i))
1160 1164 ui.write("}\n")
1161 1165
1162 1166 @command('debuginstall', [] + cmdutil.formatteropts, '', norepo=True)
1163 1167 def debuginstall(ui, **opts):
1164 1168 '''test Mercurial installation
1165 1169
1166 1170 Returns 0 on success.
1167 1171 '''
1168 1172 opts = pycompat.byteskwargs(opts)
1169 1173
1170 1174 def writetemp(contents):
1171 1175 (fd, name) = pycompat.mkstemp(prefix="hg-debuginstall-")
1172 1176 f = os.fdopen(fd, r"wb")
1173 1177 f.write(contents)
1174 1178 f.close()
1175 1179 return name
1176 1180
1177 1181 problems = 0
1178 1182
1179 1183 fm = ui.formatter('debuginstall', opts)
1180 1184 fm.startitem()
1181 1185
1182 1186 # encoding
1183 1187 fm.write('encoding', _("checking encoding (%s)...\n"), encoding.encoding)
1184 1188 err = None
1185 1189 try:
1186 1190 codecs.lookup(pycompat.sysstr(encoding.encoding))
1187 1191 except LookupError as inst:
1188 1192 err = stringutil.forcebytestr(inst)
1189 1193 problems += 1
1190 1194 fm.condwrite(err, 'encodingerror', _(" %s\n"
1191 1195 " (check that your locale is properly set)\n"), err)
1192 1196
1193 1197 # Python
1194 1198 fm.write('pythonexe', _("checking Python executable (%s)\n"),
1195 1199 pycompat.sysexecutable)
1196 1200 fm.write('pythonver', _("checking Python version (%s)\n"),
1197 1201 ("%d.%d.%d" % sys.version_info[:3]))
1198 1202 fm.write('pythonlib', _("checking Python lib (%s)...\n"),
1199 1203 os.path.dirname(pycompat.fsencode(os.__file__)))
1200 1204
1201 1205 security = set(sslutil.supportedprotocols)
1202 1206 if sslutil.hassni:
1203 1207 security.add('sni')
1204 1208
1205 1209 fm.write('pythonsecurity', _("checking Python security support (%s)\n"),
1206 1210 fm.formatlist(sorted(security), name='protocol',
1207 1211 fmt='%s', sep=','))
1208 1212
1209 1213 # These are warnings, not errors. So don't increment problem count. This
1210 1214 # may change in the future.
1211 1215 if 'tls1.2' not in security:
1212 1216 fm.plain(_(' TLS 1.2 not supported by Python install; '
1213 1217 'network connections lack modern security\n'))
1214 1218 if 'sni' not in security:
1215 1219 fm.plain(_(' SNI not supported by Python install; may have '
1216 1220 'connectivity issues with some servers\n'))
1217 1221
1218 1222 # TODO print CA cert info
1219 1223
1220 1224 # hg version
1221 1225 hgver = util.version()
1222 1226 fm.write('hgver', _("checking Mercurial version (%s)\n"),
1223 1227 hgver.split('+')[0])
1224 1228 fm.write('hgverextra', _("checking Mercurial custom build (%s)\n"),
1225 1229 '+'.join(hgver.split('+')[1:]))
1226 1230
1227 1231 # compiled modules
1228 1232 fm.write('hgmodulepolicy', _("checking module policy (%s)\n"),
1229 1233 policy.policy)
1230 1234 fm.write('hgmodules', _("checking installed modules (%s)...\n"),
1231 1235 os.path.dirname(pycompat.fsencode(__file__)))
1232 1236
1233 1237 if policy.policy in ('c', 'allow'):
1234 1238 err = None
1235 1239 try:
1236 1240 from .cext import (
1237 1241 base85,
1238 1242 bdiff,
1239 1243 mpatch,
1240 1244 osutil,
1241 1245 )
1242 1246 dir(bdiff), dir(mpatch), dir(base85), dir(osutil) # quiet pyflakes
1243 1247 except Exception as inst:
1244 1248 err = stringutil.forcebytestr(inst)
1245 1249 problems += 1
1246 1250 fm.condwrite(err, 'extensionserror', " %s\n", err)
1247 1251
1248 1252 compengines = util.compengines._engines.values()
1249 1253 fm.write('compengines', _('checking registered compression engines (%s)\n'),
1250 1254 fm.formatlist(sorted(e.name() for e in compengines),
1251 1255 name='compengine', fmt='%s', sep=', '))
1252 1256 fm.write('compenginesavail', _('checking available compression engines '
1253 1257 '(%s)\n'),
1254 1258 fm.formatlist(sorted(e.name() for e in compengines
1255 1259 if e.available()),
1256 1260 name='compengine', fmt='%s', sep=', '))
1257 1261 wirecompengines = util.compengines.supportedwireengines(util.SERVERROLE)
1258 1262 fm.write('compenginesserver', _('checking available compression engines '
1259 1263 'for wire protocol (%s)\n'),
1260 1264 fm.formatlist([e.name() for e in wirecompengines
1261 1265 if e.wireprotosupport()],
1262 1266 name='compengine', fmt='%s', sep=', '))
1263 1267 re2 = 'missing'
1264 1268 if util._re2:
1265 1269 re2 = 'available'
1266 1270 fm.plain(_('checking "re2" regexp engine (%s)\n') % re2)
1267 1271 fm.data(re2=bool(util._re2))
1268 1272
1269 1273 # templates
1270 1274 p = templater.templatepaths()
1271 1275 fm.write('templatedirs', 'checking templates (%s)...\n', ' '.join(p))
1272 1276 fm.condwrite(not p, '', _(" no template directories found\n"))
1273 1277 if p:
1274 1278 m = templater.templatepath("map-cmdline.default")
1275 1279 if m:
1276 1280 # template found, check if it is working
1277 1281 err = None
1278 1282 try:
1279 1283 templater.templater.frommapfile(m)
1280 1284 except Exception as inst:
1281 1285 err = stringutil.forcebytestr(inst)
1282 1286 p = None
1283 1287 fm.condwrite(err, 'defaulttemplateerror', " %s\n", err)
1284 1288 else:
1285 1289 p = None
1286 1290 fm.condwrite(p, 'defaulttemplate',
1287 1291 _("checking default template (%s)\n"), m)
1288 1292 fm.condwrite(not m, 'defaulttemplatenotfound',
1289 1293 _(" template '%s' not found\n"), "default")
1290 1294 if not p:
1291 1295 problems += 1
1292 1296 fm.condwrite(not p, '',
1293 1297 _(" (templates seem to have been installed incorrectly)\n"))
1294 1298
1295 1299 # editor
1296 1300 editor = ui.geteditor()
1297 1301 editor = util.expandpath(editor)
1298 1302 editorbin = procutil.shellsplit(editor)[0]
1299 1303 fm.write('editor', _("checking commit editor... (%s)\n"), editorbin)
1300 1304 cmdpath = procutil.findexe(editorbin)
1301 1305 fm.condwrite(not cmdpath and editor == 'vi', 'vinotfound',
1302 1306 _(" No commit editor set and can't find %s in PATH\n"
1303 1307 " (specify a commit editor in your configuration"
1304 1308 " file)\n"), not cmdpath and editor == 'vi' and editorbin)
1305 1309 fm.condwrite(not cmdpath and editor != 'vi', 'editornotfound',
1306 1310 _(" Can't find editor '%s' in PATH\n"
1307 1311 " (specify a commit editor in your configuration"
1308 1312 " file)\n"), not cmdpath and editorbin)
1309 1313 if not cmdpath and editor != 'vi':
1310 1314 problems += 1
1311 1315
1312 1316 # check username
1313 1317 username = None
1314 1318 err = None
1315 1319 try:
1316 1320 username = ui.username()
1317 1321 except error.Abort as e:
1318 1322 err = stringutil.forcebytestr(e)
1319 1323 problems += 1
1320 1324
1321 1325 fm.condwrite(username, 'username', _("checking username (%s)\n"), username)
1322 1326 fm.condwrite(err, 'usernameerror', _("checking username...\n %s\n"
1323 1327 " (specify a username in your configuration file)\n"), err)
1324 1328
1325 1329 fm.condwrite(not problems, '',
1326 1330 _("no problems detected\n"))
1327 1331 if not problems:
1328 1332 fm.data(problems=problems)
1329 1333 fm.condwrite(problems, 'problems',
1330 1334 _("%d problems detected,"
1331 1335 " please check your install!\n"), problems)
1332 1336 fm.end()
1333 1337
1334 1338 return problems
1335 1339
1336 1340 @command('debugknown', [], _('REPO ID...'), norepo=True)
1337 1341 def debugknown(ui, repopath, *ids, **opts):
1338 1342 """test whether node ids are known to a repo
1339 1343
1340 1344 Every ID must be a full-length hex node id string. Returns a list of 0s
1341 1345 and 1s indicating unknown/known.
1342 1346 """
1343 1347 opts = pycompat.byteskwargs(opts)
1344 1348 repo = hg.peer(ui, opts, repopath)
1345 1349 if not repo.capable('known'):
1346 1350 raise error.Abort("known() not supported by target repository")
1347 1351 flags = repo.known([bin(s) for s in ids])
1348 1352 ui.write("%s\n" % ("".join([f and "1" or "0" for f in flags])))
1349 1353
1350 1354 @command('debuglabelcomplete', [], _('LABEL...'))
1351 1355 def debuglabelcomplete(ui, repo, *args):
1352 1356 '''backwards compatibility with old bash completion scripts (DEPRECATED)'''
1353 1357 debugnamecomplete(ui, repo, *args)
1354 1358
1355 1359 @command('debuglocks',
1356 1360 [('L', 'force-lock', None, _('free the store lock (DANGEROUS)')),
1357 1361 ('W', 'force-wlock', None,
1358 1362 _('free the working state lock (DANGEROUS)')),
1359 1363 ('s', 'set-lock', None, _('set the store lock until stopped')),
1360 1364 ('S', 'set-wlock', None,
1361 1365 _('set the working state lock until stopped'))],
1362 1366 _('[OPTION]...'))
1363 1367 def debuglocks(ui, repo, **opts):
1364 1368 """show or modify state of locks
1365 1369
1366 1370 By default, this command will show which locks are held. This
1367 1371 includes the user and process holding the lock, the amount of time
1368 1372 the lock has been held, and the machine name where the process is
1369 1373 running if it's not local.
1370 1374
1371 1375 Locks protect the integrity of Mercurial's data, so should be
1372 1376 treated with care. System crashes or other interruptions may cause
1373 1377 locks to not be properly released, though Mercurial will usually
1374 1378 detect and remove such stale locks automatically.
1375 1379
1376 1380 However, detecting stale locks may not always be possible (for
1377 1381 instance, on a shared filesystem). Removing locks may also be
1378 1382 blocked by filesystem permissions.
1379 1383
1380 1384 Setting a lock will prevent other commands from changing the data.
1381 1385 The command will wait until an interruption (SIGINT, SIGTERM, ...) occurs.
1382 1386 The set locks are removed when the command exits.
1383 1387
1384 1388 Returns 0 if no locks are held.
1385 1389
1386 1390 """
1387 1391
1388 1392 if opts.get(r'force_lock'):
1389 1393 repo.svfs.unlink('lock')
1390 1394 if opts.get(r'force_wlock'):
1391 1395 repo.vfs.unlink('wlock')
1392 1396 if opts.get(r'force_lock') or opts.get(r'force_wlock'):
1393 1397 return 0
1394 1398
1395 1399 locks = []
1396 1400 try:
1397 1401 if opts.get(r'set_wlock'):
1398 1402 try:
1399 1403 locks.append(repo.wlock(False))
1400 1404 except error.LockHeld:
1401 1405 raise error.Abort(_('wlock is already held'))
1402 1406 if opts.get(r'set_lock'):
1403 1407 try:
1404 1408 locks.append(repo.lock(False))
1405 1409 except error.LockHeld:
1406 1410 raise error.Abort(_('lock is already held'))
1407 1411 if len(locks):
1408 1412 ui.promptchoice(_("ready to release the lock (y)? $$ &Yes"))
1409 1413 return 0
1410 1414 finally:
1411 1415 release(*locks)
1412 1416
1413 1417 now = time.time()
1414 1418 held = 0
1415 1419
1416 1420 def report(vfs, name, method):
1417 1421 # this causes stale locks to get reaped for more accurate reporting
1418 1422 try:
1419 1423 l = method(False)
1420 1424 except error.LockHeld:
1421 1425 l = None
1422 1426
1423 1427 if l:
1424 1428 l.release()
1425 1429 else:
1426 1430 try:
1427 1431 st = vfs.lstat(name)
1428 1432 age = now - st[stat.ST_MTIME]
1429 1433 user = util.username(st.st_uid)
1430 1434 locker = vfs.readlock(name)
1431 1435 if ":" in locker:
1432 1436 host, pid = locker.split(':')
1433 1437 if host == socket.gethostname():
1434 1438 locker = 'user %s, process %s' % (user, pid)
1435 1439 else:
1436 1440 locker = 'user %s, process %s, host %s' \
1437 1441 % (user, pid, host)
1438 1442 ui.write(("%-6s %s (%ds)\n") % (name + ":", locker, age))
1439 1443 return 1
1440 1444 except OSError as e:
1441 1445 if e.errno != errno.ENOENT:
1442 1446 raise
1443 1447
1444 1448 ui.write(("%-6s free\n") % (name + ":"))
1445 1449 return 0
1446 1450
1447 1451 held += report(repo.svfs, "lock", repo.lock)
1448 1452 held += report(repo.vfs, "wlock", repo.wlock)
1449 1453
1450 1454 return held
1451 1455
1452 1456 @command('debugmanifestfulltextcache', [
1453 1457 ('', 'clear', False, _('clear the cache')),
1454 1458 ('a', 'add', '', _('add the given manifest node to the cache'),
1455 1459 _('NODE'))
1456 1460 ], '')
1457 1461 def debugmanifestfulltextcache(ui, repo, add=None, **opts):
1458 1462 """show, clear or amend the contents of the manifest fulltext cache"""
1459 1463 with repo.lock():
1460 1464 r = repo.manifestlog.getstorage(b'')
1461 1465 try:
1462 1466 cache = r._fulltextcache
1463 1467 except AttributeError:
1464 1468 ui.warn(_(
1465 1469 "Current revlog implementation doesn't appear to have a "
1466 1470 'manifest fulltext cache\n'))
1467 1471 return
1468 1472
1469 1473 if opts.get(r'clear'):
1470 1474 cache.clear()
1471 1475
1472 1476 if add:
1473 1477 try:
1474 1478 manifest = repo.manifestlog[r.lookup(add)]
1475 1479 except error.LookupError as e:
1476 1480 raise error.Abort(e, hint="Check your manifest node id")
1477 1481 manifest.read() # stores revision in cache too
1478 1482
1479 1483 if not len(cache):
1480 1484 ui.write(_('Cache empty'))
1481 1485 else:
1482 1486 ui.write(
1483 1487 _('Cache contains %d manifest entries, in order of most to '
1484 1488 'least recent:\n') % (len(cache),))
1485 1489 totalsize = 0
1486 1490 for nodeid in cache:
1487 1491 # Use cache.get to not update the LRU order
1488 1492 data = cache.get(nodeid)
1489 1493 size = len(data)
1490 1494 totalsize += size + 24 # 20 bytes nodeid, 4 bytes size
1491 1495 ui.write(_('id: %s, size %s\n') % (
1492 1496 hex(nodeid), util.bytecount(size)))
1493 1497 ondisk = cache._opener.stat('manifestfulltextcache').st_size
1494 1498 ui.write(
1495 1499 _('Total cache data size %s, on-disk %s\n') % (
1496 1500 util.bytecount(totalsize), util.bytecount(ondisk))
1497 1501 )
1498 1502
1499 1503 @command('debugmergestate', [], '')
1500 1504 def debugmergestate(ui, repo, *args):
1501 1505 """print merge state
1502 1506
1503 1507 Use --verbose to print out information about whether v1 or v2 merge state
1504 1508 was chosen."""
1505 1509 def _hashornull(h):
1506 1510 if h == nullhex:
1507 1511 return 'null'
1508 1512 else:
1509 1513 return h
1510 1514
1511 1515 def printrecords(version):
1512 1516 ui.write(('* version %d records\n') % version)
1513 1517 if version == 1:
1514 1518 records = v1records
1515 1519 else:
1516 1520 records = v2records
1517 1521
1518 1522 for rtype, record in records:
1519 1523 # pretty print some record types
1520 1524 if rtype == 'L':
1521 1525 ui.write(('local: %s\n') % record)
1522 1526 elif rtype == 'O':
1523 1527 ui.write(('other: %s\n') % record)
1524 1528 elif rtype == 'm':
1525 1529 driver, mdstate = record.split('\0', 1)
1526 1530 ui.write(('merge driver: %s (state "%s")\n')
1527 1531 % (driver, mdstate))
1528 1532 elif rtype in 'FDC':
1529 1533 r = record.split('\0')
1530 1534 f, state, hash, lfile, afile, anode, ofile = r[0:7]
1531 1535 if version == 1:
1532 1536 onode = 'not stored in v1 format'
1533 1537 flags = r[7]
1534 1538 else:
1535 1539 onode, flags = r[7:9]
1536 1540 ui.write(('file: %s (record type "%s", state "%s", hash %s)\n')
1537 1541 % (f, rtype, state, _hashornull(hash)))
1538 1542 ui.write((' local path: %s (flags "%s")\n') % (lfile, flags))
1539 1543 ui.write((' ancestor path: %s (node %s)\n')
1540 1544 % (afile, _hashornull(anode)))
1541 1545 ui.write((' other path: %s (node %s)\n')
1542 1546 % (ofile, _hashornull(onode)))
1543 1547 elif rtype == 'f':
1544 1548 filename, rawextras = record.split('\0', 1)
1545 1549 extras = rawextras.split('\0')
1546 1550 i = 0
1547 1551 extrastrings = []
1548 1552 while i < len(extras):
1549 1553 extrastrings.append('%s = %s' % (extras[i], extras[i + 1]))
1550 1554 i += 2
1551 1555
1552 1556 ui.write(('file extras: %s (%s)\n')
1553 1557 % (filename, ', '.join(extrastrings)))
1554 1558 elif rtype == 'l':
1555 1559 labels = record.split('\0', 2)
1556 1560 labels = [l for l in labels if len(l) > 0]
1557 1561 ui.write(('labels:\n'))
1558 1562 ui.write((' local: %s\n' % labels[0]))
1559 1563 ui.write((' other: %s\n' % labels[1]))
1560 1564 if len(labels) > 2:
1561 1565 ui.write((' base: %s\n' % labels[2]))
1562 1566 else:
1563 1567 ui.write(('unrecognized entry: %s\t%s\n')
1564 1568 % (rtype, record.replace('\0', '\t')))
1565 1569
1566 1570 # Avoid mergestate.read() since it may raise an exception for unsupported
1567 1571 # merge state records. We shouldn't be doing this, but this is OK since this
1568 1572 # command is pretty low-level.
1569 1573 ms = mergemod.mergestate(repo)
1570 1574
1571 1575 # sort so that reasonable information is on top
1572 1576 v1records = ms._readrecordsv1()
1573 1577 v2records = ms._readrecordsv2()
1574 1578 order = 'LOml'
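# sort records so the types listed in 'order' come first, in that order;
# any other record types follow, ordered by their payload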
1575 1579 def key(r):
1576 1580 idx = order.find(r[0])
1577 1581 if idx == -1:
1578 1582 return (1, r[1])
1579 1583 else:
1580 1584 return (0, idx)
1581 1585 v1records.sort(key=key)
1582 1586 v2records.sort(key=key)
1583 1587
1584 1588 if not v1records and not v2records:
1585 1589 ui.write(('no merge state found\n'))
1586 1590 elif not v2records:
1587 1591 ui.note(('no version 2 merge state\n'))
1588 1592 printrecords(1)
1589 1593 elif ms._v1v2match(v1records, v2records):
1590 1594 ui.note(('v1 and v2 states match: using v2\n'))
1591 1595 printrecords(2)
1592 1596 else:
1593 1597 ui.note(('v1 and v2 states mismatch: using v1\n'))
1594 1598 printrecords(1)
1595 1599 if ui.verbose:
1596 1600 printrecords(2)
1597 1601
1598 1602 @command('debugnamecomplete', [], _('NAME...'))
1599 1603 def debugnamecomplete(ui, repo, *args):
1600 1604 '''complete "names" - tags, open branch names, bookmark names'''
1601 1605
1602 1606 names = set()
1603 1607 # since we previously only listed open branches, we will handle that
1604 1608 # specially (after this for loop)
1605 1609 for name, ns in repo.names.iteritems():
1606 1610 if name != 'branches':
1607 1611 names.update(ns.listnames(repo))
1608 1612 names.update(tag for (tag, heads, tip, closed)
1609 1613 in repo.branchmap().iterbranches() if not closed)
1610 1614 completions = set()
1611 1615 if not args:
1612 1616 args = ['']
1613 1617 for a in args:
1614 1618 completions.update(n for n in names if n.startswith(a))
1615 1619 ui.write('\n'.join(sorted(completions)))
1616 1620 ui.write('\n')
1617 1621
1618 1622 @command('debugobsolete',
1619 1623 [('', 'flags', 0, _('markers flag')),
1620 1624 ('', 'record-parents', False,
1621 1625 _('record parent information for the precursor')),
1622 1626 ('r', 'rev', [], _('display markers relevant to REV')),
1623 1627 ('', 'exclusive', False, _('restrict display to markers only '
1624 1628 'relevant to REV')),
1625 1629 ('', 'index', False, _('display index of the marker')),
1626 1630 ('', 'delete', [], _('delete markers specified by indices')),
1627 1631 ] + cmdutil.commitopts2 + cmdutil.formatteropts,
1628 1632 _('[OBSOLETED [REPLACEMENT ...]]'))
1629 1633 def debugobsolete(ui, repo, precursor=None, *successors, **opts):
1630 1634 """create arbitrary obsolete marker
1631 1635
1632 1636 With no arguments, displays the list of obsolescence markers."""
1633 1637
1634 1638 opts = pycompat.byteskwargs(opts)
1635 1639
1636 1640 def parsenodeid(s):
1637 1641 try:
1638 1642 # We do not use revsingle/revrange functions here to accept
1639 1643 # arbitrary node identifiers, possibly not present in the
1640 1644 # local repository.
1641 1645 n = bin(s)
1642 1646 if len(n) != len(nullid):
1643 1647 raise TypeError()
1644 1648 return n
1645 1649 except TypeError:
1646 1650 raise error.Abort('changeset references must be full hexadecimal '
1647 1651 'node identifiers')
1648 1652
1649 1653 if opts.get('delete'):
1650 1654 indices = []
1651 1655 for v in opts.get('delete'):
1652 1656 try:
1653 1657 indices.append(int(v))
1654 1658 except ValueError:
1655 1659 raise error.Abort(_('invalid index value: %r') % v,
1656 1660 hint=_('use integers for indices'))
1657 1661
1658 1662 if repo.currenttransaction():
1659 1663 raise error.Abort(_('cannot delete obsmarkers in the middle '
1660 1664 'of transaction.'))
1661 1665
1662 1666 with repo.lock():
1663 1667 n = repair.deleteobsmarkers(repo.obsstore, indices)
1664 1668 ui.write(_('deleted %i obsolescence markers\n') % n)
1665 1669
1666 1670 return
1667 1671
1668 1672 if precursor is not None:
1669 1673 if opts['rev']:
1670 1674 raise error.Abort('cannot select revision when creating marker')
1671 1675 metadata = {}
1672 1676 metadata['user'] = encoding.fromlocal(opts['user'] or ui.username())
1673 1677 succs = tuple(parsenodeid(succ) for succ in successors)
1674 1678 l = repo.lock()
1675 1679 try:
1676 1680 tr = repo.transaction('debugobsolete')
1677 1681 try:
1678 1682 date = opts.get('date')
1679 1683 if date:
1680 1684 date = dateutil.parsedate(date)
1681 1685 else:
1682 1686 date = None
1683 1687 prec = parsenodeid(precursor)
1684 1688 parents = None
1685 1689 if opts['record_parents']:
1686 1690 if prec not in repo.unfiltered():
1687 1691 raise error.Abort('cannot use --record-parents on '
1688 1692 'unknown changesets')
1689 1693 parents = repo.unfiltered()[prec].parents()
1690 1694 parents = tuple(p.node() for p in parents)
1691 1695 repo.obsstore.create(tr, prec, succs, opts['flags'],
1692 1696 parents=parents, date=date,
1693 1697 metadata=metadata, ui=ui)
1694 1698 tr.close()
1695 1699 except ValueError as exc:
1696 1700 raise error.Abort(_('bad obsmarker input: %s') %
1697 1701 pycompat.bytestr(exc))
1698 1702 finally:
1699 1703 tr.release()
1700 1704 finally:
1701 1705 l.release()
1702 1706 else:
1703 1707 if opts['rev']:
1704 1708 revs = scmutil.revrange(repo, opts['rev'])
1705 1709 nodes = [repo[r].node() for r in revs]
1706 1710 markers = list(obsutil.getmarkers(repo, nodes=nodes,
1707 1711 exclusive=opts['exclusive']))
1708 1712 markers.sort(key=lambda x: x._data)
1709 1713 else:
1710 1714 markers = obsutil.getmarkers(repo)
1711 1715
1712 1716 markerstoiter = markers
1713 1717 isrelevant = lambda m: True
1714 1718 if opts.get('rev') and opts.get('index'):
1715 1719 markerstoiter = obsutil.getmarkers(repo)
1716 1720 markerset = set(markers)
1717 1721 isrelevant = lambda m: m in markerset
1718 1722
1719 1723 fm = ui.formatter('debugobsolete', opts)
1720 1724 for i, m in enumerate(markerstoiter):
1721 1725 if not isrelevant(m):
1722 1726 # marker can be irrelevant when we're iterating over a set
1723 1727 # of markers (markerstoiter) which is bigger than the set
1724 1728 # of markers we want to display (markers)
1725 1729 # this can happen if both --index and --rev options are
1726 1730 # provided and thus we need to iterate over all of the markers
1727 1731 # to get the correct indices, but only display the ones that
1728 1732 # are relevant to --rev value
1729 1733 continue
1730 1734 fm.startitem()
1731 1735 ind = i if opts.get('index') else None
1732 1736 cmdutil.showmarker(fm, m, index=ind)
1733 1737 fm.end()
1734 1738
1735 1739 @command('debugpathcomplete',
1736 1740 [('f', 'full', None, _('complete an entire path')),
1737 1741 ('n', 'normal', None, _('show only normal files')),
1738 1742 ('a', 'added', None, _('show only added files')),
1739 1743 ('r', 'removed', None, _('show only removed files'))],
1740 1744 _('FILESPEC...'))
1741 1745 def debugpathcomplete(ui, repo, *specs, **opts):
1742 1746 '''complete part or all of a tracked path
1743 1747
1744 1748 This command supports shells that offer path name completion. It
1745 1749 currently completes only files already known to the dirstate.
1746 1750
1747 1751 Completion extends only to the next path segment unless
1748 1752 --full is specified, in which case entire paths are used.'''
1749 1753
1750 1754 def complete(path, acceptable):
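# 'acceptable' is a string of dirstate status characters (e.g. 'nmar');
# only files whose current dirstate status is in it are completed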
1751 1755 dirstate = repo.dirstate
1752 1756 spec = os.path.normpath(os.path.join(pycompat.getcwd(), path))
1753 1757 rootdir = repo.root + pycompat.ossep
1754 1758 if spec != repo.root and not spec.startswith(rootdir):
1755 1759 return [], []
1756 1760 if os.path.isdir(spec):
1757 1761 spec += '/'
1758 1762 spec = spec[len(rootdir):]
1759 1763 fixpaths = pycompat.ossep != '/'
1760 1764 if fixpaths:
1761 1765 spec = spec.replace(pycompat.ossep, '/')
1762 1766 speclen = len(spec)
1763 1767 fullpaths = opts[r'full']
1764 1768 files, dirs = set(), set()
1765 1769 adddir, addfile = dirs.add, files.add
1766 1770 for f, st in dirstate.iteritems():
1767 1771 if f.startswith(spec) and st[0] in acceptable:
1768 1772 if fixpaths:
1769 1773 f = f.replace('/', pycompat.ossep)
1770 1774 if fullpaths:
1771 1775 addfile(f)
1772 1776 continue
1773 1777 s = f.find(pycompat.ossep, speclen)
1774 1778 if s >= 0:
1775 1779 adddir(f[:s])
1776 1780 else:
1777 1781 addfile(f)
1778 1782 return files, dirs
1779 1783
1780 1784 acceptable = ''
1781 1785 if opts[r'normal']:
1782 1786 acceptable += 'nm'
1783 1787 if opts[r'added']:
1784 1788 acceptable += 'a'
1785 1789 if opts[r'removed']:
1786 1790 acceptable += 'r'
1787 1791 cwd = repo.getcwd()
1788 1792 if not specs:
1789 1793 specs = ['.']
1790 1794
1791 1795 files, dirs = set(), set()
1792 1796 for spec in specs:
1793 1797 f, d = complete(spec, acceptable or 'nmar')
1794 1798 files.update(f)
1795 1799 dirs.update(d)
1796 1800 files.update(dirs)
1797 1801 ui.write('\n'.join(repo.pathto(p, cwd) for p in sorted(files)))
1798 1802 ui.write('\n')
1799 1803
1800 1804 @command('debugpeer', [], _('PATH'), norepo=True)
1801 1805 def debugpeer(ui, path):
1802 1806 """establish a connection to a peer repository"""
1803 1807 # Always enable peer request logging. Requires --debug to display
1804 1808 # though.
1805 1809 overrides = {
1806 1810 ('devel', 'debug.peer-request'): True,
1807 1811 }
1808 1812
1809 1813 with ui.configoverride(overrides):
1810 1814 peer = hg.peer(ui, {}, path)
1811 1815
1812 1816 local = peer.local() is not None
1813 1817 canpush = peer.canpush()
1814 1818
1815 1819 ui.write(_('url: %s\n') % peer.url())
1816 1820 ui.write(_('local: %s\n') % (_('yes') if local else _('no')))
1817 1821 ui.write(_('pushable: %s\n') % (_('yes') if canpush else _('no')))
1818 1822
1819 1823 @command('debugpickmergetool',
1820 1824 [('r', 'rev', '', _('check for files in this revision'), _('REV')),
1821 1825 ('', 'changedelete', None, _('emulate merging change and delete')),
1822 1826 ] + cmdutil.walkopts + cmdutil.mergetoolopts,
1823 1827 _('[PATTERN]...'),
1824 1828 inferrepo=True)
1825 1829 def debugpickmergetool(ui, repo, *pats, **opts):
1826 1830 """examine which merge tool is chosen for specified file
1827 1831
1828 1832 As described in :hg:`help merge-tools`, Mercurial examines
1829 1833 the configurations below in this order to decide which merge tool is
1830 1834 chosen for the specified file.
1831 1835
1832 1836 1. ``--tool`` option
1833 1837 2. ``HGMERGE`` environment variable
1834 1838 3. configurations in ``merge-patterns`` section
1835 1839 4. configuration of ``ui.merge``
1836 1840 5. configurations in ``merge-tools`` section
1837 1841 6. ``hgmerge`` tool (for historical reasons only)
1838 1842 7. default tool for fallback (``:merge`` or ``:prompt``)
1839 1843
1840 1844 This command writes out the examination result in the style below::
1841 1845
1842 1846 FILE = MERGETOOL
1843 1847
1844 1848 By default, all files known in the first parent context of the
1845 1849 working directory are examined. Use file patterns and/or -I/-X
1846 1850 options to limit target files. -r/--rev is also useful to examine
1847 1851 files in another context without actually updating to it.
1848 1852
1849 1853 With --debug, this command also shows warning messages while matching
1850 1854 against ``merge-patterns`` and so on. It is recommended to
1851 1855 use this option with explicit file patterns and/or -I/-X options,
1852 1856 because this option increases the amount of output per file according
1853 1857 to configurations in hgrc.
1854 1858
1855 1859 With -v/--verbose, this command first shows the configurations below
1856 1860 (only those that are specified).
1857 1861
1858 1862 - ``--tool`` option
1859 1863 - ``HGMERGE`` environment variable
1860 1864 - configuration of ``ui.merge``
1861 1865
1862 1866 If a merge tool is chosen before matching against
1863 1867 ``merge-patterns``, this command can't show any helpful
1864 1868 information, even with --debug. In such a case, the information above
1865 1869 is useful for understanding why a merge tool was chosen.
1866 1870 """
1867 1871 opts = pycompat.byteskwargs(opts)
1868 1872 overrides = {}
1869 1873 if opts['tool']:
1870 1874 overrides[('ui', 'forcemerge')] = opts['tool']
1871 1875 ui.note(('with --tool %r\n') % (pycompat.bytestr(opts['tool'])))
1872 1876
1873 1877 with ui.configoverride(overrides, 'debugmergepatterns'):
1874 1878 hgmerge = encoding.environ.get("HGMERGE")
1875 1879 if hgmerge is not None:
1876 1880 ui.note(('with HGMERGE=%r\n') % (pycompat.bytestr(hgmerge)))
1877 1881 uimerge = ui.config("ui", "merge")
1878 1882 if uimerge:
1879 1883 ui.note(('with ui.merge=%r\n') % (pycompat.bytestr(uimerge)))
1880 1884
1881 1885 ctx = scmutil.revsingle(repo, opts.get('rev'))
1882 1886 m = scmutil.match(ctx, pats, opts)
1883 1887 changedelete = opts['changedelete']
1884 1888 for path in ctx.walk(m):
1885 1889 fctx = ctx[path]
1886 1890 try:
1887 1891 if not ui.debugflag:
1888 1892 ui.pushbuffer(error=True)
1889 1893 tool, toolpath = filemerge._picktool(repo, ui, path,
1890 1894 fctx.isbinary(),
1891 1895 'l' in fctx.flags(),
1892 1896 changedelete)
1893 1897 finally:
1894 1898 if not ui.debugflag:
1895 1899 ui.popbuffer()
1896 1900 ui.write(('%s = %s\n') % (path, tool))
1897 1901
1898 1902 @command('debugpushkey', [], _('REPO NAMESPACE [KEY OLD NEW]'), norepo=True)
1899 1903 def debugpushkey(ui, repopath, namespace, *keyinfo, **opts):
1900 1904 '''access the pushkey key/value protocol
1901 1905
1902 1906 With two args, list the keys in the given namespace.
1903 1907
1904 1908 With five args, set a key to new if it currently is set to old.
1905 1909 Reports success or failure.
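
    For example, ``hg debugpushkey PATH bookmarks`` lists the bookmarks
    advertised by the peer at PATH.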
1906 1910 '''
1907 1911
1908 1912 target = hg.peer(ui, {}, repopath)
1909 1913 if keyinfo:
1910 1914 key, old, new = keyinfo
1911 1915 with target.commandexecutor() as e:
1912 1916 r = e.callcommand('pushkey', {
1913 1917 'namespace': namespace,
1914 1918 'key': key,
1915 1919 'old': old,
1916 1920 'new': new,
1917 1921 }).result()
1918 1922
1919 1923 ui.status(pycompat.bytestr(r) + '\n')
1920 1924 return not r
1921 1925 else:
1922 1926 for k, v in sorted(target.listkeys(namespace).iteritems()):
1923 1927 ui.write("%s\t%s\n" % (stringutil.escapestr(k),
1924 1928 stringutil.escapestr(v)))
1925 1929
1926 1930 @command('debugpvec', [], _('A B'))
1927 1931 def debugpvec(ui, repo, a, b=None):
1928 1932 ca = scmutil.revsingle(repo, a)
1929 1933 cb = scmutil.revsingle(repo, b)
1930 1934 pa = pvec.ctxpvec(ca)
1931 1935 pb = pvec.ctxpvec(cb)
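# summarize how the two position vectors compare: '=' identical,
# '<'/'>' one appears to be an ancestor of the other, '|' unrelated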
1932 1936 if pa == pb:
1933 1937 rel = "="
1934 1938 elif pa > pb:
1935 1939 rel = ">"
1936 1940 elif pa < pb:
1937 1941 rel = "<"
1938 1942 elif pa | pb:
1939 1943 rel = "|"
1940 1944 ui.write(_("a: %s\n") % pa)
1941 1945 ui.write(_("b: %s\n") % pb)
1942 1946 ui.write(_("depth(a): %d depth(b): %d\n") % (pa._depth, pb._depth))
1943 1947 ui.write(_("delta: %d hdist: %d distance: %d relation: %s\n") %
1944 1948 (abs(pa._depth - pb._depth), pvec._hamming(pa._vec, pb._vec),
1945 1949 pa.distance(pb), rel))
1946 1950
1947 1951 @command('debugrebuilddirstate|debugrebuildstate',
1948 1952 [('r', 'rev', '', _('revision to rebuild to'), _('REV')),
1949 1953 ('', 'minimal', None, _('only rebuild files that are inconsistent with '
1950 1954 'the working copy parent')),
1951 1955 ],
1952 1956 _('[-r REV]'))
1953 1957 def debugrebuilddirstate(ui, repo, rev, **opts):
1954 1958 """rebuild the dirstate as it would look like for the given revision
1955 1959
1956 1960 If no revision is specified, the working directory's first parent will be used.
1957 1961
1958 1962 The dirstate will be set to the files of the given revision.
1959 1963 The actual working directory content or existing dirstate
1960 1964 information such as adds or removes is not considered.
1961 1965
1962 1966 ``minimal`` will only rebuild the dirstate status for files that claim to be
1963 1967 tracked but are not in the parent manifest, or that exist in the parent
1964 1968 manifest but are not in the dirstate. It will not change adds, removes, or
1965 1969 modified files that are in the working copy parent.
1966 1970
1967 1971 One use of this command is to make the next :hg:`status` invocation
1968 1972 check the actual file content.
1969 1973 """
1970 1974 ctx = scmutil.revsingle(repo, rev)
1971 1975 with repo.wlock():
1972 1976 dirstate = repo.dirstate
1973 1977 changedfiles = None
1974 1978 # See command doc for what minimal does.
1975 1979 if opts.get(r'minimal'):
1976 1980 manifestfiles = set(ctx.manifest().keys())
1977 1981 dirstatefiles = set(dirstate)
1978 1982 manifestonly = manifestfiles - dirstatefiles
1979 1983 dsonly = dirstatefiles - manifestfiles
1980 1984 dsnotadded = set(f for f in dsonly if dirstate[f] != 'a')
1981 1985 changedfiles = manifestonly | dsnotadded
1982 1986
1983 1987 dirstate.rebuild(ctx.node(), ctx.manifest(), changedfiles)
1984 1988
1985 1989 @command('debugrebuildfncache', [], '')
1986 1990 def debugrebuildfncache(ui, repo):
1987 1991 """rebuild the fncache file"""
1988 1992 repair.rebuildfncache(ui, repo)
1989 1993
1990 1994 @command('debugrename',
1991 1995 [('r', 'rev', '', _('revision to debug'), _('REV'))],
1992 1996 _('[-r REV] FILE'))
1993 1997 def debugrename(ui, repo, file1, *pats, **opts):
1994 1998 """dump rename information"""
1995 1999
1996 2000 opts = pycompat.byteskwargs(opts)
1997 2001 ctx = scmutil.revsingle(repo, opts.get('rev'))
1998 2002 m = scmutil.match(ctx, (file1,) + pats, opts)
1999 2003 for abs in ctx.walk(m):
2000 2004 fctx = ctx[abs]
2001 2005 o = fctx.filelog().renamed(fctx.filenode())
2002 2006 rel = m.rel(abs)
2003 2007 if o:
2004 2008 ui.write(_("%s renamed from %s:%s\n") % (rel, o[0], hex(o[1])))
2005 2009 else:
2006 2010 ui.write(_("%s not renamed\n") % rel)
2007 2011
2008 2012 @command('debugrevlog', cmdutil.debugrevlogopts +
2009 2013 [('d', 'dump', False, _('dump index data'))],
2010 2014 _('-c|-m|FILE'),
2011 2015 optionalrepo=True)
2012 2016 def debugrevlog(ui, repo, file_=None, **opts):
2013 2017 """show data and statistics about a revlog"""
2014 2018 opts = pycompat.byteskwargs(opts)
2015 2019 r = cmdutil.openrevlog(repo, 'debugrevlog', file_, opts)
2016 2020
2017 2021 if opts.get("dump"):
2018 2022 numrevs = len(r)
2019 2023 ui.write(("# rev p1rev p2rev start end deltastart base p1 p2"
2020 2024 " rawsize totalsize compression heads chainlen\n"))
2021 2025 ts = 0
2022 2026 heads = set()
2023 2027
2024 2028 for rev in pycompat.xrange(numrevs):
2025 2029 dbase = r.deltaparent(rev)
2026 2030 if dbase == -1:
2027 2031 dbase = rev
2028 2032 cbase = r.chainbase(rev)
2029 2033 clen = r.chainlen(rev)
2030 2034 p1, p2 = r.parentrevs(rev)
2031 2035 rs = r.rawsize(rev)
2032 2036 ts = ts + rs
2033 2037 heads -= set(r.parentrevs(rev))
2034 2038 heads.add(rev)
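# running compression estimate: total uncompressed size seen so far
# versus the offset at which this revision's stored data ends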
2035 2039 try:
2036 2040 compression = ts / r.end(rev)
2037 2041 except ZeroDivisionError:
2038 2042 compression = 0
2039 2043 ui.write("%5d %5d %5d %5d %5d %10d %4d %4d %4d %7d %9d "
2040 2044 "%11d %5d %8d\n" %
2041 2045 (rev, p1, p2, r.start(rev), r.end(rev),
2042 2046 r.start(dbase), r.start(cbase),
2043 2047 r.start(p1), r.start(p2),
2044 2048 rs, ts, compression, len(heads), clen))
2045 2049 return 0
2046 2050
2047 2051 v = r.version
2048 2052 format = v & 0xFFFF
2049 2053 flags = []
2050 2054 gdelta = False
2051 2055 if v & revlog.FLAG_INLINE_DATA:
2052 2056 flags.append('inline')
2053 2057 if v & revlog.FLAG_GENERALDELTA:
2054 2058 gdelta = True
2055 2059 flags.append('generaldelta')
2056 2060 if not flags:
2057 2061 flags = ['(none)']
2058 2062
2059 2063 ### tracks merge vs single parent
2060 2064 nummerges = 0
2061 2065
2062 2066 ### tracks the ways the deltas are built
2063 2067 # nodelta
2064 2068 numempty = 0
2065 2069 numemptytext = 0
2066 2070 numemptydelta = 0
2067 2071 # full file content
2068 2072 numfull = 0
2069 2073 # intermediate snapshot against a prior snapshot
2070 2074 numsemi = 0
2071 2075 # snapshot count per depth
2072 2076 numsnapdepth = collections.defaultdict(lambda: 0)
2073 2077 # delta against previous revision
2074 2078 numprev = 0
2075 2079 # delta against first or second parent (not prev)
2076 2080 nump1 = 0
2077 2081 nump2 = 0
2078 2082 # delta against neither prev nor parents
2079 2083 numother = 0
2080 2084 # delta against prev that are also first or second parent
2081 2085 # (details of `numprev`)
2082 2086 nump1prev = 0
2083 2087 nump2prev = 0
2084 2088
2085 2089 # data about delta chain of each revs
2086 2090 chainlengths = []
2087 2091 chainbases = []
2088 2092 chainspans = []
2089 2093
2090 2094 # data about each revision
2091 2095 datasize = [None, 0, 0]
2092 2096 fullsize = [None, 0, 0]
2093 2097 semisize = [None, 0, 0]
2094 2098 # snapshot count per depth
2095 2099 snapsizedepth = collections.defaultdict(lambda: [None, 0, 0])
2096 2100 deltasize = [None, 0, 0]
2097 2101 chunktypecounts = {}
2098 2102 chunktypesizes = {}
2099 2103
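# addsize() maintains a [min, max, total] triple for a size distribution;
# the totals are divided by the matching counts below to report averages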
2100 2104 def addsize(size, l):
2101 2105 if l[0] is None or size < l[0]:
2102 2106 l[0] = size
2103 2107 if size > l[1]:
2104 2108 l[1] = size
2105 2109 l[2] += size
2106 2110
2107 2111 numrevs = len(r)
2108 2112 for rev in pycompat.xrange(numrevs):
2109 2113 p1, p2 = r.parentrevs(rev)
2110 2114 delta = r.deltaparent(rev)
2111 2115 if format > 0:
2112 2116 addsize(r.rawsize(rev), datasize)
2113 2117 if p2 != nullrev:
2114 2118 nummerges += 1
2115 2119 size = r.length(rev)
2116 2120 if delta == nullrev:
2117 2121 chainlengths.append(0)
2118 2122 chainbases.append(r.start(rev))
2119 2123 chainspans.append(size)
2120 2124 if size == 0:
2121 2125 numempty += 1
2122 2126 numemptytext += 1
2123 2127 else:
2124 2128 numfull += 1
2125 2129 numsnapdepth[0] += 1
2126 2130 addsize(size, fullsize)
2127 2131 addsize(size, snapsizedepth[0])
2128 2132 else:
2129 2133 chainlengths.append(chainlengths[delta] + 1)
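# chain span: number of bytes of revlog data between the start of the
# chain base and the end of this revision (how far a reader must read)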
2130 2134 baseaddr = chainbases[delta]
2131 2135 revaddr = r.start(rev)
2132 2136 chainbases.append(baseaddr)
2133 2137 chainspans.append((revaddr - baseaddr) + size)
2134 2138 if size == 0:
2135 2139 numempty += 1
2136 2140 numemptydelta += 1
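# intermediate snapshot: stored as a delta whose base is itself a
# snapshot; its depth is the number of snapshot levels between it and
# the full text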
2137 2141 elif r.issnapshot(rev):
2138 2142 addsize(size, semisize)
2139 2143 numsemi += 1
2140 2144 depth = r.snapshotdepth(rev)
2141 2145 numsnapdepth[depth] += 1
2142 2146 addsize(size, snapsizedepth[depth])
2143 2147 else:
2144 2148 addsize(size, deltasize)
2145 2149 if delta == rev - 1:
2146 2150 numprev += 1
2147 2151 if delta == p1:
2148 2152 nump1prev += 1
2149 2153 elif delta == p2:
2150 2154 nump2prev += 1
2151 2155 elif delta == p1:
2152 2156 nump1 += 1
2153 2157 elif delta == p2:
2154 2158 nump2 += 1
2155 2159 elif delta != nullrev:
2156 2160 numother += 1
2157 2161
2158 2162 # Obtain data on the raw chunks in the revlog.
2159 2163 if util.safehasattr(r, '_getsegmentforrevs'):
2160 2164 segment = r._getsegmentforrevs(rev, rev)[1]
2161 2165 else:
2162 2166 segment = r._revlog._getsegmentforrevs(rev, rev)[1]
2163 2167 if segment:
2164 2168 chunktype = bytes(segment[0:1])
2165 2169 else:
2166 2170 chunktype = 'empty'
2167 2171
2168 2172 if chunktype not in chunktypecounts:
2169 2173 chunktypecounts[chunktype] = 0
2170 2174 chunktypesizes[chunktype] = 0
2171 2175
2172 2176 chunktypecounts[chunktype] += 1
2173 2177 chunktypesizes[chunktype] += size
2174 2178
2175 2179 # Adjust size min value for empty cases
2176 2180 for size in (datasize, fullsize, semisize, deltasize):
2177 2181 if size[0] is None:
2178 2182 size[0] = 0
2179 2183
2180 2184 numdeltas = numrevs - numfull - numempty - numsemi
2181 2185 numoprev = numprev - nump1prev - nump2prev
2182 2186 totalrawsize = datasize[2]
2183 2187 datasize[2] /= numrevs
2184 2188 fulltotal = fullsize[2]
2185 2189 fullsize[2] /= numfull
2186 2190 semitotal = semisize[2]
2187 2191 snaptotal = {}
2188 2192 if 0 < numsemi:
2189 2193 semisize[2] /= numsemi
2190 2194 for depth in snapsizedepth:
2191 2195 snaptotal[depth] = snapsizedepth[depth][2]
2192 2196 snapsizedepth[depth][2] /= numsnapdepth[depth]
2193 2197
2194 2198 deltatotal = deltasize[2]
2195 2199 if numdeltas > 0:
2196 2200 deltasize[2] /= numdeltas
2197 2201 totalsize = fulltotal + semitotal + deltatotal
2198 2202 avgchainlen = sum(chainlengths) / numrevs
2199 2203 maxchainlen = max(chainlengths)
2200 2204 maxchainspan = max(chainspans)
2201 2205 compratio = 1
2202 2206 if totalsize:
2203 2207 compratio = totalrawsize / totalsize
2204 2208
2205 2209 basedfmtstr = '%%%dd\n'
2206 2210 basepcfmtstr = '%%%dd %s(%%5.2f%%%%)\n'
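# these templates right-align integers in a field sized to the widest
# value; the 'pc' variant also appends a percentage in parentheses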
2207 2211
2208 2212 def dfmtstr(max):
2209 2213 return basedfmtstr % len(str(max))
2210 2214 def pcfmtstr(max, padding=0):
2211 2215 return basepcfmtstr % (len(str(max)), ' ' * padding)
2212 2216
2213 2217 def pcfmt(value, total):
2214 2218 if total:
2215 2219 return (value, 100 * float(value) / total)
2216 2220 else:
2217 2221 return value, 100.0
2218 2222
2219 2223 ui.write(('format : %d\n') % format)
2220 2224 ui.write(('flags : %s\n') % ', '.join(flags))
2221 2225
2222 2226 ui.write('\n')
2223 2227 fmt = pcfmtstr(totalsize)
2224 2228 fmt2 = dfmtstr(totalsize)
2225 2229 ui.write(('revisions : ') + fmt2 % numrevs)
2226 2230 ui.write((' merges : ') + fmt % pcfmt(nummerges, numrevs))
2227 2231 ui.write((' normal : ') + fmt % pcfmt(numrevs - nummerges, numrevs))
2228 2232 ui.write(('revisions : ') + fmt2 % numrevs)
2229 2233 ui.write((' empty : ') + fmt % pcfmt(numempty, numrevs))
2230 2234 ui.write((' text : ')
2231 2235 + fmt % pcfmt(numemptytext, numemptytext + numemptydelta))
2232 2236 ui.write((' delta : ')
2233 2237 + fmt % pcfmt(numemptydelta, numemptytext + numemptydelta))
2234 2238 ui.write((' snapshot : ') + fmt % pcfmt(numfull + numsemi, numrevs))
2235 2239 for depth in sorted(numsnapdepth):
2236 2240 ui.write((' lvl-%-3d : ' % depth)
2237 2241 + fmt % pcfmt(numsnapdepth[depth], numrevs))
2238 2242 ui.write((' deltas : ') + fmt % pcfmt(numdeltas, numrevs))
2239 2243 ui.write(('revision size : ') + fmt2 % totalsize)
2240 2244 ui.write((' snapshot : ')
2241 2245 + fmt % pcfmt(fulltotal + semitotal, totalsize))
2242 2246 for depth in sorted(numsnapdepth):
2243 2247 ui.write((' lvl-%-3d : ' % depth)
2244 2248 + fmt % pcfmt(snaptotal[depth], totalsize))
2245 2249 ui.write((' deltas : ') + fmt % pcfmt(deltatotal, totalsize))
2246 2250
2247 2251 def fmtchunktype(chunktype):
2248 2252 if chunktype == 'empty':
2249 2253 return ' %s : ' % chunktype
2250 2254 elif chunktype in pycompat.bytestr(string.ascii_letters):
2251 2255 return ' 0x%s (%s) : ' % (hex(chunktype), chunktype)
2252 2256 else:
2253 2257 return ' 0x%s : ' % hex(chunktype)
2254 2258
2255 2259 ui.write('\n')
2256 2260 ui.write(('chunks : ') + fmt2 % numrevs)
2257 2261 for chunktype in sorted(chunktypecounts):
2258 2262 ui.write(fmtchunktype(chunktype))
2259 2263 ui.write(fmt % pcfmt(chunktypecounts[chunktype], numrevs))
2260 2264 ui.write(('chunks size : ') + fmt2 % totalsize)
2261 2265 for chunktype in sorted(chunktypecounts):
2262 2266 ui.write(fmtchunktype(chunktype))
2263 2267 ui.write(fmt % pcfmt(chunktypesizes[chunktype], totalsize))
2264 2268
2265 2269 ui.write('\n')
2266 2270 fmt = dfmtstr(max(avgchainlen, maxchainlen, maxchainspan, compratio))
2267 2271 ui.write(('avg chain length : ') + fmt % avgchainlen)
2268 2272 ui.write(('max chain length : ') + fmt % maxchainlen)
2269 2273 ui.write(('max chain reach : ') + fmt % maxchainspan)
2270 2274 ui.write(('compression ratio : ') + fmt % compratio)
2271 2275
2272 2276 if format > 0:
2273 2277 ui.write('\n')
2274 2278 ui.write(('uncompressed data size (min/max/avg) : %d / %d / %d\n')
2275 2279 % tuple(datasize))
2276 2280 ui.write(('full revision size (min/max/avg) : %d / %d / %d\n')
2277 2281 % tuple(fullsize))
2278 2282 ui.write(('inter-snapshot size (min/max/avg) : %d / %d / %d\n')
2279 2283 % tuple(semisize))
2280 2284 for depth in sorted(snapsizedepth):
2281 2285 if depth == 0:
2282 2286 continue
2283 2287 ui.write((' level-%-3d (min/max/avg) : %d / %d / %d\n')
2284 2288 % ((depth,) + tuple(snapsizedepth[depth])))
2285 2289 ui.write(('delta size (min/max/avg) : %d / %d / %d\n')
2286 2290 % tuple(deltasize))
2287 2291
2288 2292 if numdeltas > 0:
2289 2293 ui.write('\n')
2290 2294 fmt = pcfmtstr(numdeltas)
2291 2295 fmt2 = pcfmtstr(numdeltas, 4)
2292 2296 ui.write(('deltas against prev : ') + fmt % pcfmt(numprev, numdeltas))
2293 2297 if numprev > 0:
2294 2298 ui.write((' where prev = p1 : ') + fmt2 % pcfmt(nump1prev,
2295 2299 numprev))
2296 2300 ui.write((' where prev = p2 : ') + fmt2 % pcfmt(nump2prev,
2297 2301 numprev))
2298 2302 ui.write((' other : ') + fmt2 % pcfmt(numoprev,
2299 2303 numprev))
2300 2304 if gdelta:
2301 2305 ui.write(('deltas against p1 : ')
2302 2306 + fmt % pcfmt(nump1, numdeltas))
2303 2307 ui.write(('deltas against p2 : ')
2304 2308 + fmt % pcfmt(nump2, numdeltas))
2305 2309 ui.write(('deltas against other : ') + fmt % pcfmt(numother,
2306 2310 numdeltas))
2307 2311
2308 2312 @command('debugrevlogindex', cmdutil.debugrevlogopts +
2309 2313 [('f', 'format', 0, _('revlog format'), _('FORMAT'))],
2310 2314 _('[-f FORMAT] -c|-m|FILE'),
2311 2315 optionalrepo=True)
2312 2316 def debugrevlogindex(ui, repo, file_=None, **opts):
2313 2317 """dump the contents of a revlog index"""
2314 2318 opts = pycompat.byteskwargs(opts)
2315 2319 r = cmdutil.openrevlog(repo, 'debugrevlogindex', file_, opts)
2316 2320 format = opts.get('format', 0)
2317 2321 if format not in (0, 1):
2318 2322 raise error.Abort(_("unknown format %d") % format)
2319 2323
2320 2324 if ui.debugflag:
2321 2325 shortfn = hex
2322 2326 else:
2323 2327 shortfn = short
2324 2328
2325 2329 # There might not be anything in r, so have a sane default
2326 2330 idlen = 12
2327 2331 for i in r:
2328 2332 idlen = len(shortfn(r.node(i)))
2329 2333 break
2330 2334
2331 2335 if format == 0:
2332 2336 if ui.verbose:
2333 2337 ui.write((" rev offset length linkrev"
2334 2338 " %s %s p2\n") % ("nodeid".ljust(idlen),
2335 2339 "p1".ljust(idlen)))
2336 2340 else:
2337 2341 ui.write((" rev linkrev %s %s p2\n") % (
2338 2342 "nodeid".ljust(idlen), "p1".ljust(idlen)))
2339 2343 elif format == 1:
2340 2344 if ui.verbose:
2341 2345 ui.write((" rev flag offset length size link p1"
2342 2346 " p2 %s\n") % "nodeid".rjust(idlen))
2343 2347 else:
2344 2348 ui.write((" rev flag size link p1 p2 %s\n") %
2345 2349 "nodeid".rjust(idlen))
2346 2350
2347 2351 for i in r:
2348 2352 node = r.node(i)
2349 2353 if format == 0:
2350 2354 try:
2351 2355 pp = r.parents(node)
2352 2356 except Exception:
2353 2357 pp = [nullid, nullid]
2354 2358 if ui.verbose:
2355 2359 ui.write("% 6d % 9d % 7d % 7d %s %s %s\n" % (
2356 2360 i, r.start(i), r.length(i), r.linkrev(i),
2357 2361 shortfn(node), shortfn(pp[0]), shortfn(pp[1])))
2358 2362 else:
2359 2363 ui.write("% 6d % 7d %s %s %s\n" % (
2360 2364 i, r.linkrev(i), shortfn(node), shortfn(pp[0]),
2361 2365 shortfn(pp[1])))
2362 2366 elif format == 1:
2363 2367 pr = r.parentrevs(i)
2364 2368 if ui.verbose:
2365 2369 ui.write("% 6d %04x % 8d % 8d % 8d % 6d % 6d % 6d %s\n" % (
2366 2370 i, r.flags(i), r.start(i), r.length(i), r.rawsize(i),
2367 2371 r.linkrev(i), pr[0], pr[1], shortfn(node)))
2368 2372 else:
2369 2373 ui.write("% 6d %04x % 8d % 6d % 6d % 6d %s\n" % (
2370 2374 i, r.flags(i), r.rawsize(i), r.linkrev(i), pr[0], pr[1],
2371 2375 shortfn(node)))
2372 2376
2373 2377 @command('debugrevspec',
2374 2378 [('', 'optimize', None,
2375 2379 _('print parsed tree after optimizing (DEPRECATED)')),
2376 2380 ('', 'show-revs', True, _('print list of result revisions (default)')),
2377 2381 ('s', 'show-set', None, _('print internal representation of result set')),
2378 2382 ('p', 'show-stage', [],
2379 2383 _('print parsed tree at the given stage'), _('NAME')),
2380 2384 ('', 'no-optimized', False, _('evaluate tree without optimization')),
2381 2385 ('', 'verify-optimized', False, _('verify optimized result')),
2382 2386 ],
2383 2387 ('REVSPEC'))
2384 2388 def debugrevspec(ui, repo, expr, **opts):
2385 2389 """parse and apply a revision specification
2386 2390
2387 2391 Use the -p/--show-stage option to print the parsed tree at the given stages.
2388 2392 Use -p all to print the tree at every stage.
2389 2393
2390 2394 Use the --no-show-revs option with -s or -p to print only the set
2391 2395 representation or the parsed tree respectively.
2392 2396
2393 2397 Use --verify-optimized to compare the optimized result with the unoptimized
2394 2398 one. Returns 1 if the optimized result differs.
2395 2399 """
2396 2400 opts = pycompat.byteskwargs(opts)
2397 2401 aliases = ui.configitems('revsetalias')
2398 2402 stages = [
2399 2403 ('parsed', lambda tree: tree),
2400 2404 ('expanded', lambda tree: revsetlang.expandaliases(tree, aliases,
2401 2405 ui.warn)),
2402 2406 ('concatenated', revsetlang.foldconcat),
2403 2407 ('analyzed', revsetlang.analyze),
2404 2408 ('optimized', revsetlang.optimize),
2405 2409 ]
2406 2410 if opts['no_optimized']:
2407 2411 stages = stages[:-1]
2408 2412 if opts['verify_optimized'] and opts['no_optimized']:
2409 2413 raise error.Abort(_('cannot use --verify-optimized with '
2410 2414 '--no-optimized'))
2411 2415 stagenames = set(n for n, f in stages)
2412 2416
2413 2417 showalways = set()
2414 2418 showchanged = set()
2415 2419 if ui.verbose and not opts['show_stage']:
2416 2420 # show parsed tree by --verbose (deprecated)
2417 2421 showalways.add('parsed')
2418 2422 showchanged.update(['expanded', 'concatenated'])
2419 2423 if opts['optimize']:
2420 2424 showalways.add('optimized')
2421 2425 if opts['show_stage'] and opts['optimize']:
2422 2426 raise error.Abort(_('cannot use --optimize with --show-stage'))
2423 2427 if opts['show_stage'] == ['all']:
2424 2428 showalways.update(stagenames)
2425 2429 else:
2426 2430 for n in opts['show_stage']:
2427 2431 if n not in stagenames:
2428 2432 raise error.Abort(_('invalid stage name: %s') % n)
2429 2433 showalways.update(opts['show_stage'])
2430 2434
2431 2435 treebystage = {}
2432 2436 printedtree = None
2433 2437 tree = revsetlang.parse(expr, lookup=revset.lookupfn(repo))
2434 2438 for n, f in stages:
2435 2439 treebystage[n] = tree = f(tree)
2436 2440 if n in showalways or (n in showchanged and tree != printedtree):
2437 2441 if opts['show_stage'] or n != 'parsed':
2438 2442 ui.write(("* %s:\n") % n)
2439 2443 ui.write(revsetlang.prettyformat(tree), "\n")
2440 2444 printedtree = tree
2441 2445
2442 2446 if opts['verify_optimized']:
2443 2447 arevs = revset.makematcher(treebystage['analyzed'])(repo)
2444 2448 brevs = revset.makematcher(treebystage['optimized'])(repo)
2445 2449 if opts['show_set'] or (opts['show_set'] is None and ui.verbose):
2446 2450 ui.write(("* analyzed set:\n"), stringutil.prettyrepr(arevs), "\n")
2447 2451 ui.write(("* optimized set:\n"), stringutil.prettyrepr(brevs), "\n")
2448 2452 arevs = list(arevs)
2449 2453 brevs = list(brevs)
2450 2454 if arevs == brevs:
2451 2455 return 0
2452 2456 ui.write(('--- analyzed\n'), label='diff.file_a')
2453 2457 ui.write(('+++ optimized\n'), label='diff.file_b')
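# emit a diff-style, line-by-line comparison of the two revision lists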
2454 2458 sm = difflib.SequenceMatcher(None, arevs, brevs)
2455 2459 for tag, alo, ahi, blo, bhi in sm.get_opcodes():
2456 2460 if tag in ('delete', 'replace'):
2457 2461 for c in arevs[alo:ahi]:
2458 2462 ui.write('-%s\n' % c, label='diff.deleted')
2459 2463 if tag in ('insert', 'replace'):
2460 2464 for c in brevs[blo:bhi]:
2461 2465 ui.write('+%s\n' % c, label='diff.inserted')
2462 2466 if tag == 'equal':
2463 2467 for c in arevs[alo:ahi]:
2464 2468 ui.write(' %s\n' % c)
2465 2469 return 1
2466 2470
2467 2471 func = revset.makematcher(tree)
2468 2472 revs = func(repo)
2469 2473 if opts['show_set'] or (opts['show_set'] is None and ui.verbose):
2470 2474 ui.write(("* set:\n"), stringutil.prettyrepr(revs), "\n")
2471 2475 if not opts['show_revs']:
2472 2476 return
2473 2477 for c in revs:
2474 2478 ui.write("%d\n" % c)
2475 2479
2476 2480 @command('debugserve', [
2477 2481 ('', 'sshstdio', False, _('run an SSH server bound to process handles')),
2478 2482 ('', 'logiofd', '', _('file descriptor to log server I/O to')),
2479 2483 ('', 'logiofile', '', _('file to log server I/O to')),
2480 2484 ], '')
2481 2485 def debugserve(ui, repo, **opts):
2482 2486 """run a server with advanced settings
2483 2487
2484 2488 This command is similar to :hg:`serve`. It exists partially as a
2485 2489 workaround to the fact that ``hg serve --stdio`` must have specific
2486 2490 arguments for security reasons.
2487 2491 """
2488 2492 opts = pycompat.byteskwargs(opts)
2489 2493
2490 2494 if not opts['sshstdio']:
2491 2495 raise error.Abort(_('only --sshstdio is currently supported'))
2492 2496
2493 2497 logfh = None
2494 2498
2495 2499 if opts['logiofd'] and opts['logiofile']:
2496 2500 raise error.Abort(_('cannot use both --logiofd and --logiofile'))
2497 2501
2498 2502 if opts['logiofd']:
2499 2503 # Line buffered because output is line based.
2500 2504 try:
2501 2505 logfh = os.fdopen(int(opts['logiofd']), r'ab', 1)
2502 2506 except OSError as e:
2503 2507 if e.errno != errno.ESPIPE:
2504 2508 raise
2505 2509 # can't seek a pipe, so `ab` mode fails on py3
2506 2510 logfh = os.fdopen(int(opts['logiofd']), r'wb', 1)
2507 2511 elif opts['logiofile']:
2508 2512 logfh = open(opts['logiofile'], 'ab', 1)
2509 2513
2510 2514 s = wireprotoserver.sshserver(ui, repo, logfh=logfh)
2511 2515 s.serve_forever()
2512 2516
2513 2517 @command('debugsetparents', [], _('REV1 [REV2]'))
2514 2518 def debugsetparents(ui, repo, rev1, rev2=None):
2515 2519 """manually set the parents of the current working directory
2516 2520
2517 2521 This is useful for writing repository conversion tools, but should
2518 2522 be used with care. For example, neither the working directory nor the
2519 2523 dirstate is updated, so file status may be incorrect after running this
2520 2524 command.
2521 2525
2522 2526 Returns 0 on success.
2523 2527 """
2524 2528
2525 2529 node1 = scmutil.revsingle(repo, rev1).node()
2526 2530 node2 = scmutil.revsingle(repo, rev2, 'null').node()
2527 2531
2528 2532 with repo.wlock():
2529 2533 repo.setparents(node1, node2)
2530 2534
2531 2535 @command('debugssl', [], '[SOURCE]', optionalrepo=True)
2532 2536 def debugssl(ui, repo, source=None, **opts):
2533 2537 '''test a secure connection to a server
2534 2538
2535 2539 This builds the certificate chain for the server on Windows, installing the
2536 2540 missing intermediates and trusted root via Windows Update if necessary. It
2537 2541 does nothing on other platforms.
2538 2542
2539 2543 If SOURCE is omitted, the 'default' path will be used. If a URL is given,
2540 2544 that server is used. See :hg:`help urls` for more information.
2541 2545
2542 2546 If the update succeeds, retry the original operation. Otherwise, the cause
2543 2547 of the SSL error is likely another issue.
2544 2548 '''
2545 2549 if not pycompat.iswindows:
2546 2550 raise error.Abort(_('certificate chain building is only possible on '
2547 2551 'Windows'))
2548 2552
2549 2553 if not source:
2550 2554 if not repo:
2551 2555 raise error.Abort(_("there is no Mercurial repository here, and no "
2552 2556 "server specified"))
2553 2557 source = "default"
2554 2558
2555 2559 source, branches = hg.parseurl(ui.expandpath(source))
2556 2560 url = util.url(source)
2557 2561 addr = None
2558 2562
2559 2563 defaultport = {'https': 443, 'ssh': 22}
2560 2564 if url.scheme in defaultport:
2561 2565 try:
2562 2566 addr = (url.host, int(url.port or defaultport[url.scheme]))
2563 2567 except ValueError:
2564 2568 raise error.Abort(_("malformed port number in URL"))
2565 2569 else:
2566 2570 raise error.Abort(_("only https and ssh connections are supported"))
2567 2571
2568 2572 from . import win32
2569 2573
2570 2574 s = ssl.wrap_socket(socket.socket(), ssl_version=ssl.PROTOCOL_TLS,
2571 2575 cert_reqs=ssl.CERT_NONE, ca_certs=None)
2572 2576
2573 2577 try:
2574 2578 s.connect(addr)
2575 2579 cert = s.getpeercert(True)
2576 2580
2577 2581 ui.status(_('checking the certificate chain for %s\n') % url.host)
2578 2582
2579 2583 complete = win32.checkcertificatechain(cert, build=False)
2580 2584
2581 2585 if not complete:
2582 2586 ui.status(_('certificate chain is incomplete, updating... '))
2583 2587
2584 2588 if not win32.checkcertificatechain(cert):
2585 2589 ui.status(_('failed.\n'))
2586 2590 else:
2587 2591 ui.status(_('done.\n'))
2588 2592 else:
2589 2593 ui.status(_('full certificate chain is available\n'))
2590 2594 finally:
2591 2595 s.close()
2592 2596
2593 2597 @command('debugsub',
2594 2598 [('r', 'rev', '',
2595 2599 _('revision to check'), _('REV'))],
2596 2600 _('[-r REV] [REV]'))
2597 2601 def debugsub(ui, repo, rev=None):
2598 2602 ctx = scmutil.revsingle(repo, rev, None)
2599 2603 for k, v in sorted(ctx.substate.items()):
2600 2604 ui.write(('path %s\n') % k)
2601 2605 ui.write((' source %s\n') % v[0])
2602 2606 ui.write((' revision %s\n') % v[1])
2603 2607
2604 2608 @command('debugsuccessorssets',
2605 2609 [('', 'closest', False, _('return closest successors sets only'))],
2606 2610 _('[REV]'))
2607 2611 def debugsuccessorssets(ui, repo, *revs, **opts):
2608 2612 """show set of successors for revision
2609 2613
2610 2614 A successors set of changeset A is a consistent group of revisions that
2611 2615 succeed A. It contains non-obsolete changesets only unless the closest
2612 2616 successors sets option (--closest) is set.
2613 2617
2614 2618 In most cases a changeset A has a single successors set containing a single
2615 2619 successor (changeset A replaced by A').
2616 2620
2617 2621 A changeset that is made obsolete with no successors is called "pruned".
2618 2622 Such changesets have no successors sets at all.
2619 2623
2620 2624 A changeset that has been "split" will have a successors set containing
2621 2625 more than one successor.
2622 2626
2623 2627 A changeset that has been rewritten in multiple different ways is called
2624 2628 "divergent". Such changesets have multiple successor sets (each of which
2625 2629 may also be split, i.e. have multiple successors).
2626 2630
2627 2631 Results are displayed as follows::
2628 2632
2629 2633 <rev1>
2630 2634 <successors-1A>
2631 2635 <rev2>
2632 2636 <successors-2A>
2633 2637 <successors-2B1> <successors-2B2> <successors-2B3>
2634 2638
2635 2639 Here rev2 has two possible (i.e. divergent) successors sets. The first
2636 2640 holds one element, whereas the second holds three (i.e. the changeset has
2637 2641 been split).
2638 2642 """
2639 2643 # passed to successorssets caching computation from one call to another
2640 2644 cache = {}
2641 2645 ctx2str = bytes
2642 2646 node2str = short
2643 2647 for rev in scmutil.revrange(repo, revs):
2644 2648 ctx = repo[rev]
2645 2649 ui.write('%s\n'% ctx2str(ctx))
2646 2650 for succsset in obsutil.successorssets(repo, ctx.node(),
2647 2651 closest=opts[r'closest'],
2648 2652 cache=cache):
2649 2653 if succsset:
2650 2654 ui.write(' ')
2651 2655 ui.write(node2str(succsset[0]))
2652 2656 for node in succsset[1:]:
2653 2657 ui.write(' ')
2654 2658 ui.write(node2str(node))
2655 2659 ui.write('\n')
2656 2660
2657 2661 @command('debugtemplate',
2658 2662 [('r', 'rev', [], _('apply template on changesets'), _('REV')),
2659 2663 ('D', 'define', [], _('define template keyword'), _('KEY=VALUE'))],
2660 2664 _('[-r REV]... [-D KEY=VALUE]... TEMPLATE'),
2661 2665 optionalrepo=True)
2662 2666 def debugtemplate(ui, repo, tmpl, **opts):
2663 2667 """parse and apply a template
2664 2668
2665 2669 If -r/--rev is given, the template is processed as a log template and
2666 2670 applied to the given changesets. Otherwise, it is processed as a generic
2667 2671 template.
2668 2672
2669 2673 Use --verbose to print the parsed tree.
2670 2674 """
2671 2675 revs = None
2672 2676 if opts[r'rev']:
2673 2677 if repo is None:
2674 2678 raise error.RepoError(_('there is no Mercurial repository here '
2675 2679 '(.hg not found)'))
2676 2680 revs = scmutil.revrange(repo, opts[r'rev'])
2677 2681
2678 2682 props = {}
2679 2683 for d in opts[r'define']:
2680 2684 try:
2681 2685 k, v = (e.strip() for e in d.split('=', 1))
2682 2686 if not k or k == 'ui':
2683 2687 raise ValueError
2684 2688 props[k] = v
2685 2689 except ValueError:
2686 2690 raise error.Abort(_('malformed keyword definition: %s') % d)
2687 2691
2688 2692 if ui.verbose:
2689 2693 aliases = ui.configitems('templatealias')
2690 2694 tree = templater.parse(tmpl)
2691 2695 ui.note(templater.prettyformat(tree), '\n')
2692 2696 newtree = templater.expandaliases(tree, aliases)
2693 2697 if newtree != tree:
2694 2698 ui.note(("* expanded:\n"), templater.prettyformat(newtree), '\n')
2695 2699
2696 2700 if revs is None:
2697 2701 tres = formatter.templateresources(ui, repo)
2698 2702 t = formatter.maketemplater(ui, tmpl, resources=tres)
2699 2703 if ui.verbose:
2700 2704 kwds, funcs = t.symbolsuseddefault()
2701 2705 ui.write(("* keywords: %s\n") % ', '.join(sorted(kwds)))
2702 2706 ui.write(("* functions: %s\n") % ', '.join(sorted(funcs)))
2703 2707 ui.write(t.renderdefault(props))
2704 2708 else:
2705 2709 displayer = logcmdutil.maketemplater(ui, repo, tmpl)
2706 2710 if ui.verbose:
2707 2711 kwds, funcs = displayer.t.symbolsuseddefault()
2708 2712 ui.write(("* keywords: %s\n") % ', '.join(sorted(kwds)))
2709 2713 ui.write(("* functions: %s\n") % ', '.join(sorted(funcs)))
2710 2714 for r in revs:
2711 2715 displayer.show(repo[r], **pycompat.strkwargs(props))
2712 2716 displayer.close()
2713 2717
2714 2718 @command('debuguigetpass', [
2715 2719 ('p', 'prompt', '', _('prompt text'), _('TEXT')),
2716 2720 ], _('[-p TEXT]'), norepo=True)
2717 2721 def debuguigetpass(ui, prompt=''):
2718 2722 """show prompt to type password"""
2719 2723 r = ui.getpass(prompt)
2720 2724 ui.write(('response: %s\n') % r)
2721 2725
2722 2726 @command('debuguiprompt', [
2723 2727 ('p', 'prompt', '', _('prompt text'), _('TEXT')),
2724 2728 ], _('[-p TEXT]'), norepo=True)
2725 2729 def debuguiprompt(ui, prompt=''):
2726 2730 """show plain prompt"""
2727 2731 r = ui.prompt(prompt)
2728 2732 ui.write(('response: %s\n') % r)
2729 2733
2730 2734 @command('debugupdatecaches', [])
2731 2735 def debugupdatecaches(ui, repo, *pats, **opts):
2732 2736 """warm all known caches in the repository"""
2733 2737 with repo.wlock(), repo.lock():
2734 2738 repo.updatecaches(full=True)
2735 2739
2736 2740 @command('debugupgraderepo', [
2737 2741 ('o', 'optimize', [], _('extra optimization to perform'), _('NAME')),
2738 2742 ('', 'run', False, _('performs an upgrade')),
2739 2743 ])
2740 2744 def debugupgraderepo(ui, repo, run=False, optimize=None):
2741 2745 """upgrade a repository to use different features
2742 2746
2743 2747 If no arguments are specified, the repository is evaluated for upgrade
2744 2748 and a list of problems and potential optimizations is printed.
2745 2749
2746 2750 With ``--run``, a repository upgrade is performed. Behavior of the upgrade
2747 2751 can be influenced via additional arguments. More details will be provided
2748 2752 by the command output when run without ``--run``.
2749 2753
2750 2754 During the upgrade, the repository will be locked and no writes will be
2751 2755 allowed.
2752 2756
2753 2757 At the end of the upgrade, the repository may not be readable while new
2754 2758 repository data is swapped in. This window will be as long as it takes to
2755 2759 rename some directories inside the ``.hg`` directory. On most machines, this
2756 2760 should complete almost instantaneously and the chances of a consumer being
2757 2761 unable to access the repository should be low.
2758 2762 """
2759 2763 return upgrade.upgraderepo(ui, repo, run=run, optimize=optimize)
2760 2764
2761 2765 @command('debugwalk', cmdutil.walkopts, _('[OPTION]... [FILE]...'),
2762 2766 inferrepo=True)
2763 2767 def debugwalk(ui, repo, *pats, **opts):
2764 2768 """show how files match on given patterns"""
2765 2769 opts = pycompat.byteskwargs(opts)
2766 2770 m = scmutil.match(repo[None], pats, opts)
2767 2771 if ui.verbose:
2768 2772 ui.write(('* matcher:\n'), stringutil.prettyrepr(m), '\n')
2769 2773 items = list(repo[None].walk(m))
2770 2774 if not items:
2771 2775 return
2772 2776 f = lambda fn: fn
2773 2777 if ui.configbool('ui', 'slash') and pycompat.ossep != '/':
2774 2778 f = lambda fn: util.normpath(fn)
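# build a row format whose column widths match the longest absolute and
# relative paths; the doubled '%%' leaves literal placeholders for each row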
2775 2779 fmt = 'f %%-%ds %%-%ds %%s' % (
2776 2780 max([len(abs) for abs in items]),
2777 2781 max([len(m.rel(abs)) for abs in items]))
2778 2782 for abs in items:
2779 2783 line = fmt % (abs, f(m.rel(abs)), m.exact(abs) and 'exact' or '')
2780 2784 ui.write("%s\n" % line.rstrip())
2781 2785
2782 2786 @command('debugwhyunstable', [], _('REV'))
2783 2787 def debugwhyunstable(ui, repo, rev):
2784 2788 """explain instabilities of a changeset"""
2785 2789 for entry in obsutil.whyunstable(repo, scmutil.revsingle(repo, rev)):
2786 2790 dnodes = ''
2787 2791 if entry.get('divergentnodes'):
2788 2792 dnodes = ' '.join('%s (%s)' % (ctx.hex(), ctx.phasestr())
2789 2793 for ctx in entry['divergentnodes']) + ' '
2790 2794 ui.write('%s: %s%s %s\n' % (entry['instability'], dnodes,
2791 2795 entry['reason'], entry['node']))
2792 2796
2793 2797 @command('debugwireargs',
2794 2798 [('', 'three', '', 'three'),
2795 2799 ('', 'four', '', 'four'),
2796 2800 ('', 'five', '', 'five'),
2797 2801 ] + cmdutil.remoteopts,
2798 2802 _('REPO [OPTIONS]... [ONE [TWO]]'),
2799 2803 norepo=True)
2800 2804 def debugwireargs(ui, repopath, *vals, **opts):
2801 2805 opts = pycompat.byteskwargs(opts)
2802 2806 repo = hg.peer(ui, opts, repopath)
2803 2807 for opt in cmdutil.remoteopts:
2804 2808 del opts[opt[1]]
2805 2809 args = {}
2806 2810 for k, v in opts.iteritems():
2807 2811 if v:
2808 2812 args[k] = v
2809 2813 args = pycompat.strkwargs(args)
2810 2814 # run twice to check that we don't mess up the stream for the next command
2811 2815 res1 = repo.debugwireargs(*vals, **args)
2812 2816 res2 = repo.debugwireargs(*vals, **args)
2813 2817 ui.write("%s\n" % res1)
2814 2818 if res1 != res2:
2815 2819 ui.warn("%s\n" % res2)
2816 2820
2817 2821 def _parsewirelangblocks(fh):
2818 2822 activeaction = None
2819 2823 blocklines = []
2820 2824
2821 2825 for line in fh:
2822 2826 line = line.rstrip()
2823 2827 if not line:
2824 2828 continue
2825 2829
2826 2830 if line.startswith(b'#'):
2827 2831 continue
2828 2832
2829 2833 if not line.startswith(b' '):
2830 2834 # New block. Flush previous one.
2831 2835 if activeaction:
2832 2836 yield activeaction, blocklines
2833 2837
2834 2838 activeaction = line
2835 2839 blocklines = []
2836 2840 continue
2837 2841
2838 2842 # Else we start with an indent.
2839 2843
2840 2844 if not activeaction:
2841 2845 raise error.Abort(_('indented line outside of block'))
2842 2846
2843 2847 blocklines.append(line)
2844 2848
2845 2849 # Flush last block.
2846 2850 if activeaction:
2847 2851 yield activeaction, blocklines
2848 2852
2849 2853 @command('debugwireproto',
2850 2854 [
2851 2855 ('', 'localssh', False, _('start an SSH server for this repo')),
2852 2856 ('', 'peer', '', _('construct a specific version of the peer')),
2853 2857 ('', 'noreadstderr', False, _('do not read from stderr of the remote')),
2854 2858 ('', 'nologhandshake', False,
2855 2859 _('do not log I/O related to the peer handshake')),
2856 2860 ] + cmdutil.remoteopts,
2857 2861 _('[PATH]'),
2858 2862 optionalrepo=True)
2859 2863 def debugwireproto(ui, repo, path=None, **opts):
2860 2864 """send wire protocol commands to a server
2861 2865
2862 2866 This command can be used to issue wire protocol commands to remote
2863 2867 peers and to debug the raw data being exchanged.
2864 2868
2865 2869 ``--localssh`` will start an SSH server against the current repository
2866 2870 and connect to that. By default, the connection will perform a handshake
2867 2871 and establish an appropriate peer instance.
2868 2872
2869 2873 ``--peer`` can be used to bypass the handshake protocol and construct a
2870 2874 peer instance using the specified class type. Valid values are ``raw``,
2871 2875 ``http2``, ``ssh1``, and ``ssh2``. ``raw`` instances only allow sending
2872 2876 raw data payloads and don't support higher-level command actions.
2873 2877
2874 2878 ``--noreadstderr`` can be used to disable automatic reading from stderr
2875 2879 of the peer (for SSH connections only). Disabling automatic reading of
2876 2880 stderr is useful for making output more deterministic.
2877 2881
2878 2882 Commands are issued via a mini language which is specified via stdin.
2879 2883 The language consists of individual actions to perform. An action is
2880 2884 defined by a block. A block is defined as a line with no leading
2881 2885 space followed by 0 or more lines with leading space. Blocks are
2882 2886 effectively a high-level command with additional metadata.
2883 2887
2884 2888 Lines beginning with ``#`` are ignored.
2885 2889
2886 2890 The following sections denote available actions.
2887 2891
2888 2892 raw
2889 2893 ---
2890 2894
2891 2895 Send raw data to the server.
2892 2896
2893 2897 The block payload contains the raw data to send as one atomic send
2894 2898 operation. The data may not actually be delivered in a single system
2895 2899 call: it depends on the abilities of the transport being used.
2896 2900
2897 2901 Each line in the block is de-indented and concatenated. Then, that
2898 2902 value is evaluated as a Python b'' literal. This allows the use of
2899 2903 backslash escaping, etc.
2900 2904
2901 2905 raw+
2902 2906 ----
2903 2907
2904 2908 Behaves like ``raw`` except flushes output afterwards.
2905 2909
2906 2910 command <X>
2907 2911 -----------
2908 2912
2909 2913 Send a request to run a named command, whose name follows the ``command``
2910 2914 string.
2911 2915
2912 2916 Arguments to the command are defined as lines in this block. The format of
2913 2917 each line is ``<key> <value>``. e.g.::
2914 2918
2915 2919 command listkeys
2916 2920 namespace bookmarks
2917 2921
2918 2922 If the value begins with ``eval:``, it will be interpreted as a Python
2919 2923 literal expression. Otherwise values are interpreted as Python b'' literals.
2920 2924 This allows sending complex types and encoding special byte sequences via
2921 2925 backslash escaping.
2922 2926
2923 2927 The following arguments have special meaning:
2924 2928
2925 2929 ``PUSHFILE``
2926 2930 When defined, the *push* mechanism of the peer will be used instead
2927 2931 of the static request-response mechanism and the content of the
2928 2932 file specified in the value of this argument will be sent as the
2929 2933 command payload.
2930 2934
2931 2935 This can be used to submit a local bundle file to the remote.
2932 2936
2933 2937 batchbegin
2934 2938 ----------
2935 2939
2936 2940 Instruct the peer to begin a batched send.
2937 2941
2938 2942 All ``command`` blocks are queued for execution until the next
2939 2943 ``batchsubmit`` block.
2940 2944
2941 2945 batchsubmit
2942 2946 -----------
2943 2947
2944 2948 Submit previously queued ``command`` blocks as a batch request.
2945 2949
2946 2950 This action MUST be paired with a ``batchbegin`` action.
2947 2951
2948 2952 httprequest <method> <path>
2949 2953 ---------------------------
2950 2954
2951 2955 (HTTP peer only)
2952 2956
2953 2957 Send an HTTP request to the peer.
2954 2958
2955 2959 The HTTP request line follows the ``httprequest`` action. e.g. ``GET /foo``.
2956 2960
2957 2961 Arguments of the form ``<key>: <value>`` are interpreted as HTTP request
2958 2962 headers to add to the request. e.g. ``Accept: foo``.
2959 2963
2960 2964 The following arguments are special:
2961 2965
2962 2966 ``BODYFILE``
2963 2967 The content of the file defined as the value to this argument will be
2964 2968 transferred verbatim as the HTTP request body.
2965 2969
2966 2970 ``frame <type> <flags> <payload>``
2967 2971 Send a unified protocol frame as part of the request body.
2968 2972
2969 2973 All frames will be collected and sent as the body to the HTTP
2970 2974 request.
2971 2975
2972 2976 close
2973 2977 -----
2974 2978
2975 2979 Close the connection to the server.
2976 2980
2977 2981 flush
2978 2982 -----
2979 2983
2980 2984 Flush data written to the server.
2981 2985
2982 2986 readavailable
2983 2987 -------------
2984 2988
2985 2989 Close the write end of the connection and read all available data from
2986 2990 the server.
2987 2991
2988 2992 If the connection to the server encompasses multiple pipes, we poll both
2989 2993 pipes and read available data.
2990 2994
2991 2995 readline
2992 2996 --------
2993 2997
2994 2998 Read a line of output from the server. If there are multiple output
2995 2999 pipes, reads only the main pipe.
2996 3000
2997 3001 ereadline
2998 3002 ---------
2999 3003
3000 3004 Like ``readline``, but read from the stderr pipe, if available.
3001 3005
3002 3006 read <X>
3003 3007 --------
3004 3008
3005 3009 ``read()`` N bytes from the server's main output pipe.
3006 3010
3007 3011 eread <X>
3008 3012 ---------
3009 3013
3010 3014 ``read()`` N bytes from the server's stderr pipe, if available.
3011 3015
3012 3016 Specifying Unified Frame-Based Protocol Frames
3013 3017 ----------------------------------------------
3014 3018
3015 3019 It is possible to emit a *Unified Frame-Based Protocol* by using special
3016 3020 syntax.
3017 3021
3018 3022 A frame is composed of a type, flags, and a payload. These can be parsed
3019 3023 from a string of the form:
3020 3024
3021 3025 <request-id> <stream-id> <stream-flags> <type> <flags> <payload>
3022 3026
3023 3027 ``request-id`` and ``stream-id`` are integers defining the request and
3024 3028 stream identifiers.
3025 3029
3026 3030 ``type`` can be an integer value for the frame type or the string name
3027 3031 of the type. The strings are defined in ``wireprotoframing.py``. e.g.
3028 3032 ``command-name``.
3029 3033
3030 3034 ``stream-flags`` and ``flags`` are a ``|`` delimited list of flag
3031 3035 components. Each component (and there can be just one) can be an integer
3032 3036 or a flag name for stream flags or frame flags, respectively. Values are
3033 3037 resolved to integers and then bitwise OR'd together.
3034 3038
3035 3039 ``payload`` represents the raw frame payload. If it begins with
3036 3040 ``cbor:``, the following string is evaluated as Python code and the
3037 3041 resulting object is fed into a CBOR encoder. Otherwise it is interpreted
3038 3042 as a Python byte string literal.
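
For example, a sketch of a frame carrying a CBOR-encoded command request
(the command name is illustrative)::

    1 1 stream-begin command-request new cbor:{b'name': b'heartbeat'}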
3039 3043 """
3040 3044 opts = pycompat.byteskwargs(opts)
3041 3045
3042 3046 if opts['localssh'] and not repo:
3043 3047 raise error.Abort(_('--localssh requires a repository'))
3044 3048
3045 3049 if opts['peer'] and opts['peer'] not in ('raw', 'http2', 'ssh1', 'ssh2'):
3046 3050 raise error.Abort(_('invalid value for --peer'),
3047 3051 hint=_('valid values are "raw", "http2", "ssh1", and "ssh2"'))
3048 3052
3049 3053 if path and opts['localssh']:
3050 3054 raise error.Abort(_('cannot specify --localssh with an explicit '
3051 3055 'path'))
3052 3056
3053 3057 if ui.interactive():
3054 3058 ui.write(_('(waiting for commands on stdin)\n'))
3055 3059
3056 3060 blocks = list(_parsewirelangblocks(ui.fin))
3057 3061
3058 3062 proc = None
3059 3063 stdin = None
3060 3064 stdout = None
3061 3065 stderr = None
3062 3066 opener = None
3063 3067
3064 3068 if opts['localssh']:
3065 3069 # We start the SSH server in its own process so there is process
3066 3070 # separation. This prevents a whole class of potential bugs around
3067 3071 # shared state from interfering with server operation.
3068 3072 args = procutil.hgcmd() + [
3069 3073 '-R', repo.root,
3070 3074 'debugserve', '--sshstdio',
3071 3075 ]
3072 3076 proc = subprocess.Popen(args, stdin=subprocess.PIPE,
3073 3077 stdout=subprocess.PIPE, stderr=subprocess.PIPE,
3074 3078 bufsize=0)
3075 3079
3076 3080 stdin = proc.stdin
3077 3081 stdout = proc.stdout
3078 3082 stderr = proc.stderr
3079 3083
3080 3084 # We turn the pipes into observers so we can log I/O.
3081 3085 if ui.verbose or opts['peer'] == 'raw':
3082 3086 stdin = util.makeloggingfileobject(ui, proc.stdin, b'i',
3083 3087 logdata=True)
3084 3088 stdout = util.makeloggingfileobject(ui, proc.stdout, b'o',
3085 3089 logdata=True)
3086 3090 stderr = util.makeloggingfileobject(ui, proc.stderr, b'e',
3087 3091 logdata=True)
3088 3092
3089 3093 # --localssh also implies the peer connection settings.
3090 3094
3091 3095 url = 'ssh://localserver'
3092 3096 autoreadstderr = not opts['noreadstderr']
3093 3097
3094 3098 if opts['peer'] == 'ssh1':
3095 3099 ui.write(_('creating ssh peer for wire protocol version 1\n'))
3096 3100 peer = sshpeer.sshv1peer(ui, url, proc, stdin, stdout, stderr,
3097 3101 None, autoreadstderr=autoreadstderr)
3098 3102 elif opts['peer'] == 'ssh2':
3099 3103 ui.write(_('creating ssh peer for wire protocol version 2\n'))
3100 3104 peer = sshpeer.sshv2peer(ui, url, proc, stdin, stdout, stderr,
3101 3105 None, autoreadstderr=autoreadstderr)
3102 3106 elif opts['peer'] == 'raw':
3103 3107 ui.write(_('using raw connection to peer\n'))
3104 3108 peer = None
3105 3109 else:
3106 3110 ui.write(_('creating ssh peer from handshake results\n'))
3107 3111 peer = sshpeer.makepeer(ui, url, proc, stdin, stdout, stderr,
3108 3112 autoreadstderr=autoreadstderr)
3109 3113
3110 3114 elif path:
3111 3115 # We bypass hg.peer() so we can proxy the sockets.
3112 3116 # TODO consider not doing this because we skip
3113 3117 # ``hg.wirepeersetupfuncs`` and potentially other useful functionality.
3114 3118 u = util.url(path)
3115 3119 if u.scheme != 'http':
3116 3120 raise error.Abort(_('only http:// paths are currently supported'))
3117 3121
3118 3122 url, authinfo = u.authinfo()
3119 3123 openerargs = {
3120 3124 r'useragent': b'Mercurial debugwireproto',
3121 3125 }
3122 3126
3123 3127 # Turn pipes/sockets into observers so we can log I/O.
3124 3128 if ui.verbose:
3125 3129 openerargs.update({
3126 3130 r'loggingfh': ui,
3127 3131 r'loggingname': b's',
3128 3132 r'loggingopts': {
3129 3133 r'logdata': True,
3130 3134 r'logdataapis': False,
3131 3135 },
3132 3136 })
3133 3137
3134 3138 if ui.debugflag:
3135 3139 openerargs[r'loggingopts'][r'logdataapis'] = True
3136 3140
3137 3141 # Don't send default headers when in raw mode. This allows us to
3138 3142 # bypass most of the behavior of our URL handling code so we can
3139 3143 # have near complete control over what's sent on the wire.
3140 3144 if opts['peer'] == 'raw':
3141 3145 openerargs[r'sendaccept'] = False
3142 3146
3143 3147 opener = urlmod.opener(ui, authinfo, **openerargs)
3144 3148
3145 3149 if opts['peer'] == 'http2':
3146 3150 ui.write(_('creating http peer for wire protocol version 2\n'))
3147 3151 # We go through makepeer() because we need an API descriptor for
3148 3152 # the peer instance to be useful.
3149 3153 with ui.configoverride({
3150 3154 ('experimental', 'httppeer.advertise-v2'): True}):
3151 3155 if opts['nologhandshake']:
3152 3156 ui.pushbuffer()
3153 3157
3154 3158 peer = httppeer.makepeer(ui, path, opener=opener)
3155 3159
3156 3160 if opts['nologhandshake']:
3157 3161 ui.popbuffer()
3158 3162
3159 3163 if not isinstance(peer, httppeer.httpv2peer):
3160 3164 raise error.Abort(_('could not instantiate HTTP peer for '
3161 3165 'wire protocol version 2'),
3162 3166 hint=_('the server may not have the feature '
3163 3167 'enabled or is not allowing this '
3164 3168 'client version'))
3165 3169
3166 3170 elif opts['peer'] == 'raw':
3167 3171 ui.write(_('using raw connection to peer\n'))
3168 3172 peer = None
3169 3173 elif opts['peer']:
3170 3174 raise error.Abort(_('--peer %s not supported with HTTP peers') %
3171 3175 opts['peer'])
3172 3176 else:
3173 3177 peer = httppeer.makepeer(ui, path, opener=opener)
3174 3178
3175 3179 # We /could/ populate stdin/stdout with sock.makefile()...
3176 3180 else:
3177 3181 raise error.Abort(_('unsupported connection configuration'))
3178 3182
3179 3183 batchedcommands = None
3180 3184
3181 3185 # Now perform actions based on the parsed wire language instructions.
3182 3186 for action, lines in blocks:
3183 3187 if action in ('raw', 'raw+'):
3184 3188 if not stdin:
3185 3189 raise error.Abort(_('cannot call raw/raw+ on this peer'))
3186 3190
3187 3191 # Concatenate the data together.
3188 3192 data = ''.join(l.lstrip() for l in lines)
3189 3193 data = stringutil.unescapestr(data)
3190 3194 stdin.write(data)
3191 3195
3192 3196 if action == 'raw+':
3193 3197 stdin.flush()
3194 3198 elif action == 'flush':
3195 3199 if not stdin:
3196 3200 raise error.Abort(_('cannot call flush on this peer'))
3197 3201 stdin.flush()
3198 3202 elif action.startswith('command'):
3199 3203 if not peer:
3200 3204 raise error.Abort(_('cannot send commands unless peer instance '
3201 3205 'is available'))
3202 3206
3203 3207 command = action.split(' ', 1)[1]
3204 3208
3205 3209 args = {}
3206 3210 for line in lines:
3207 3211 # We need to allow empty values.
3208 3212 fields = line.lstrip().split(' ', 1)
3209 3213 if len(fields) == 1:
3210 3214 key = fields[0]
3211 3215 value = ''
3212 3216 else:
3213 3217 key, value = fields
3214 3218
3215 3219 if value.startswith('eval:'):
3216 3220 value = stringutil.evalpythonliteral(value[5:])
3217 3221 else:
3218 3222 value = stringutil.unescapestr(value)
3219 3223
3220 3224 args[key] = value
3221 3225
3222 3226 if batchedcommands is not None:
3223 3227 batchedcommands.append((command, args))
3224 3228 continue
3225 3229
3226 3230 ui.status(_('sending %s command\n') % command)
3227 3231
3228 3232 if 'PUSHFILE' in args:
3229 3233 with open(args['PUSHFILE'], r'rb') as fh:
3230 3234 del args['PUSHFILE']
3231 3235 res, output = peer._callpush(command, fh,
3232 3236 **pycompat.strkwargs(args))
3233 3237 ui.status(_('result: %s\n') % stringutil.escapestr(res))
3234 3238 ui.status(_('remote output: %s\n') %
3235 3239 stringutil.escapestr(output))
3236 3240 else:
3237 3241 with peer.commandexecutor() as e:
3238 3242 res = e.callcommand(command, args).result()
3239 3243
3240 3244 if isinstance(res, wireprotov2peer.commandresponse):
3241 3245 val = list(res.cborobjects())
3242 3246 ui.status(_('response: %s\n') %
3243 3247 stringutil.pprint(val, bprefix=True))
3244 3248
3245 3249 else:
3246 3250 ui.status(_('response: %s\n') %
3247 3251 stringutil.pprint(res, bprefix=True))
3248 3252
3249 3253 elif action == 'batchbegin':
3250 3254 if batchedcommands is not None:
3251 3255 raise error.Abort(_('nested batchbegin not allowed'))
3252 3256
3253 3257 batchedcommands = []
3254 3258 elif action == 'batchsubmit':
3255 3259 # There is a batching API we could go through. But it would be
3256 3260 # difficult to normalize requests into function calls. It is easier
3257 3261 # to bypass this layer and normalize to commands + args.
3258 3262 ui.status(_('sending batch with %d sub-commands\n') %
3259 3263 len(batchedcommands))
3260 3264 for i, chunk in enumerate(peer._submitbatch(batchedcommands)):
3261 3265 ui.status(_('response #%d: %s\n') %
3262 3266 (i, stringutil.escapestr(chunk)))
3263 3267
3264 3268 batchedcommands = None
3265 3269
3266 3270 elif action.startswith('httprequest '):
3267 3271 if not opener:
3268 3272 raise error.Abort(_('cannot use httprequest without an HTTP '
3269 3273 'peer'))
3270 3274
3271 3275 request = action.split(' ', 2)
3272 3276 if len(request) != 3:
3273 3277 raise error.Abort(_('invalid httprequest: expected format is '
3274 3278 '"httprequest <method> <path>'))
3275 3279
3276 3280 method, httppath = request[1:]
3277 3281 headers = {}
3278 3282 body = None
3279 3283 frames = []
3280 3284 for line in lines:
3281 3285 line = line.lstrip()
3282 3286 m = re.match(b'^([a-zA-Z0-9_-]+): (.*)$', line)
3283 3287 if m:
3284 3288 headers[m.group(1)] = m.group(2)
3285 3289 continue
3286 3290
3287 3291 if line.startswith(b'BODYFILE '):
3288 3292 with open(line.split(b' ', 1)[1], 'rb') as fh:
3289 3293 body = fh.read()
3290 3294 elif line.startswith(b'frame '):
3291 3295 frame = wireprotoframing.makeframefromhumanstring(
3292 3296 line[len(b'frame '):])
3293 3297
3294 3298 frames.append(frame)
3295 3299 else:
3296 3300 raise error.Abort(_('unknown argument to httprequest: %s') %
3297 3301 line)
3298 3302
3299 3303 url = path + httppath
3300 3304
3301 3305 if frames:
3302 3306 body = b''.join(bytes(f) for f in frames)
3303 3307
3304 3308 req = urlmod.urlreq.request(pycompat.strurl(url), body, headers)
3305 3309
3306 3310 # urllib.Request insists on using has_data() as a proxy for
3307 3311 # determining the request method. Override that to use our
3308 3312 # explicitly requested method.
3309 3313 req.get_method = lambda: pycompat.sysstr(method)
3310 3314
3311 3315 try:
3312 3316 res = opener.open(req)
3313 3317 body = res.read()
3314 3318 except util.urlerr.urlerror as e:
3315 3319 # read() method must be called, but only exists in Python 2
3316 3320 getattr(e, 'read', lambda: None)()
3317 3321 continue
3318 3322
3319 3323 if res.headers.get('Content-Type') == 'application/mercurial-cbor':
3320 3324 ui.write(_('cbor> %s\n') %
3321 3325 stringutil.pprint(cbor.loads(body), bprefix=True))
3322 3326
3323 3327 elif action == 'close':
3324 3328 peer.close()
3325 3329 elif action == 'readavailable':
3326 3330 if not stdout or not stderr:
3327 3331 raise error.Abort(_('readavailable not available on this peer'))
3328 3332
3329 3333 stdin.close()
3330 3334 stdout.read()
3331 3335 stderr.read()
3332 3336
3333 3337 elif action == 'readline':
3334 3338 if not stdout:
3335 3339 raise error.Abort(_('readline not available on this peer'))
3336 3340 stdout.readline()
3337 3341 elif action == 'ereadline':
3338 3342 if not stderr:
3339 3343 raise error.Abort(_('ereadline not available on this peer'))
3340 3344 stderr.readline()
3341 3345 elif action.startswith('read '):
3342 3346 count = int(action.split(' ', 1)[1])
3343 3347 if not stdout:
3344 3348 raise error.Abort(_('read not available on this peer'))
3345 3349 stdout.read(count)
3346 3350 elif action.startswith('eread '):
3347 3351 count = int(action.split(' ', 1)[1])
3348 3352 if not stderr:
3349 3353 raise error.Abort(_('eread not available on this peer'))
3350 3354 stderr.read(count)
3351 3355 else:
3352 3356 raise error.Abort(_('unknown action: %s') % action)
3353 3357
3354 3358 if batchedcommands is not None:
3355 3359 raise error.Abort(_('unclosed "batchbegin" request'))
3356 3360
3357 3361 if peer:
3358 3362 peer.close()
3359 3363
3360 3364 if proc:
3361 3365 proc.kill()
This diff has been collapsed as it changes many lines (709 lines changed).
@@ -1,3180 +1,2489 b''
1 1 # revlog.py - storage back-end for mercurial
2 2 #
3 3 # Copyright 2005-2007 Matt Mackall <mpm@selenic.com>
4 4 #
5 5 # This software may be used and distributed according to the terms of the
6 6 # GNU General Public License version 2 or any later version.
7 7
8 8 """Storage back-end for Mercurial.
9 9
10 10 This provides efficient delta storage with O(1) retrieve and append
11 11 and O(changes) merge between branches.
12 12 """
13 13
14 14 from __future__ import absolute_import
15 15
16 16 import collections
17 17 import contextlib
18 18 import errno
19 19 import hashlib
20 import heapq
21 20 import os
22 21 import re
23 22 import struct
24 23 import zlib
25 24
26 25 # import stuff from node for others to import from revlog
27 26 from .node import (
28 27 bin,
29 28 hex,
30 29 nullhex,
31 30 nullid,
32 31 nullrev,
33 32 wdirfilenodeids,
34 33 wdirhex,
35 34 wdirid,
36 35 wdirrev,
37 36 )
38 37 from .i18n import _
39 38 from .revlogutils.constants import (
40 39 FLAG_GENERALDELTA,
41 40 FLAG_INLINE_DATA,
42 LIMIT_DELTA2TEXT,
43 41 REVIDX_DEFAULT_FLAGS,
44 42 REVIDX_ELLIPSIS,
45 43 REVIDX_EXTSTORED,
46 44 REVIDX_FLAGS_ORDER,
47 45 REVIDX_ISCENSORED,
48 46 REVIDX_KNOWN_FLAGS,
49 47 REVIDX_RAWTEXT_CHANGING_FLAGS,
50 48 REVLOGV0,
51 49 REVLOGV1,
52 50 REVLOGV1_FLAGS,
53 51 REVLOGV2,
54 52 REVLOGV2_FLAGS,
55 53 REVLOG_DEFAULT_FLAGS,
56 54 REVLOG_DEFAULT_FORMAT,
57 55 REVLOG_DEFAULT_VERSION,
58 56 )
59 57 from .thirdparty import (
60 58 attr,
61 59 )
62 60 from . import (
63 61 ancestor,
64 62 error,
65 63 mdiff,
66 64 policy,
67 65 pycompat,
68 66 repository,
69 67 templatefilters,
70 68 util,
71 69 )
70 from .revlogutils import (
71 deltas as deltautil,
72 )
72 73 from .utils import (
73 74 interfaceutil,
74 75 stringutil,
75 76 )
76 77
77 78 # blanked usage of all the names to prevent pyflakes constraints
78 79 # We need these names available in the module for extensions.
79 80 REVLOGV0
80 81 REVLOGV1
81 82 REVLOGV2
82 83 FLAG_INLINE_DATA
83 84 FLAG_GENERALDELTA
84 85 REVLOG_DEFAULT_FLAGS
85 86 REVLOG_DEFAULT_FORMAT
86 87 REVLOG_DEFAULT_VERSION
87 88 REVLOGV1_FLAGS
88 89 REVLOGV2_FLAGS
89 90 REVIDX_ISCENSORED
90 91 REVIDX_ELLIPSIS
91 92 REVIDX_EXTSTORED
92 93 REVIDX_DEFAULT_FLAGS
93 94 REVIDX_FLAGS_ORDER
94 95 REVIDX_KNOWN_FLAGS
95 96 REVIDX_RAWTEXT_CHANGING_FLAGS
96 97
97 98 parsers = policy.importmod(r'parsers')
98 99
99 100 # Aliased for performance.
100 101 _zlibdecompress = zlib.decompress
101 102
102 103 # max size of revlog with inline data
103 104 _maxinline = 131072
104 105 _chunksize = 1048576
105 106
106 107 RevlogError = error.RevlogError
107 108 LookupError = error.LookupError
108 109 AmbiguousPrefixLookupError = error.AmbiguousPrefixLookupError
109 110 CensoredNodeError = error.CensoredNodeError
110 111 ProgrammingError = error.ProgrammingError
111 112
112 113 # Store flag processors (cf. 'addflagprocessor()' to register)
113 114 _flagprocessors = {
114 115 REVIDX_ISCENSORED: None,
115 116 }
116 117
117 118 _mdre = re.compile('\1\n')
118 119 def parsemeta(text):
119 120 """return (metadatadict, metadatasize)"""
120 121 # text can be buffer, so we can't use .startswith or .index
121 122 if text[:2] != '\1\n':
122 123 return None, None
123 124 s = _mdre.search(text, 2).start()
124 125 mtext = text[2:s]
125 126 meta = {}
126 127 for l in mtext.splitlines():
127 128 k, v = l.split(": ", 1)
128 129 meta[k] = v
129 130 return meta, (s + 2)
130 131
131 132 def packmeta(meta, text):
132 133 keys = sorted(meta)
133 134 metatext = "".join("%s: %s\n" % (k, meta[k]) for k in keys)
134 135 return "\1\n%s\1\n%s" % (metatext, text)
135 136
136 137 def _censoredtext(text):
137 138 m, offs = parsemeta(text)
138 139 return m and "censored" in m
139 140
140 141 def addflagprocessor(flag, processor):
141 142 """Register a flag processor on a revision data flag.
142 143
143 144 Invariant:
144 145 - Flags need to be defined in REVIDX_KNOWN_FLAGS and REVIDX_FLAGS_ORDER,
145 146 and REVIDX_RAWTEXT_CHANGING_FLAGS if they can alter rawtext.
146 147 - Only one flag processor can be registered on a specific flag.
147 148 - flagprocessors must be 3-tuples of functions (read, write, raw) with the
148 149 following signatures:
149 150 - (read) f(self, rawtext) -> text, bool
150 151 - (write) f(self, text) -> rawtext, bool
151 152 - (raw) f(self, rawtext) -> bool
152 153 "text" is presented to the user. "rawtext" is stored in revlog data, not
153 154 directly visible to the user.
154 155 The boolean returned by these transforms is used to determine whether
155 156 the returned text can be used for hash integrity checking. For example,
156 157 if "write" returns False, then "text" is used to generate hash. If
157 158 "write" returns True, that basically means "rawtext" returned by "write"
158 159 should be used to generate hash. Usually, "write" and "read" return
159 160 different booleans. And "raw" returns a same boolean as "write".
160 161
161 162 Note: The 'raw' transform is used for changegroup generation and in some
162 163 debug commands. In this case the transform only indicates whether the
163 164 contents can be used for hash integrity checks.
164 165 """
165 166 if not flag & REVIDX_KNOWN_FLAGS:
166 167 msg = _("cannot register processor on unknown flag '%#x'.") % (flag)
167 168 raise ProgrammingError(msg)
168 169 if flag not in REVIDX_FLAGS_ORDER:
169 170 msg = _("flag '%#x' undefined in REVIDX_FLAGS_ORDER.") % (flag)
170 171 raise ProgrammingError(msg)
171 172 if flag in _flagprocessors:
172 173 msg = _("cannot register multiple processors on flag '%#x'.") % (flag)
173 174 raise error.Abort(msg)
174 175 _flagprocessors[flag] = processor
175 176
176 177 def getoffset(q):
177 178 return int(q >> 16)
178 179
179 180 def gettype(q):
180 181 return int(q & 0xFFFF)
181 182
182 183 def offset_type(offset, type):
183 184 if (type & ~REVIDX_KNOWN_FLAGS) != 0:
184 185 raise ValueError('unknown revlog index flags')
185 186 return int(int(offset) << 16 | type)
186 187
187 188 _nullhash = hashlib.sha1(nullid)
188 189
189 190 def hash(text, p1, p2):
190 191 """generate a hash from the given text and its parent hashes
191 192
192 193 This hash combines both the current file contents and its history
193 194 in a manner that makes it easy to distinguish nodes with the same
194 195 content in the revision graph.
195 196 """
196 197 # As of now, if one of the parent nodes is null, p2 is null
197 198 if p2 == nullid:
198 199 # deep copy of a hash is faster than creating one
199 200 s = _nullhash.copy()
200 201 s.update(p1)
201 202 else:
202 203 # none of the parent nodes are nullid
203 204 if p1 < p2:
204 205 a = p1
205 206 b = p2
206 207 else:
207 208 a = p2
208 209 b = p1
209 210 s = hashlib.sha1(a)
210 211 s.update(b)
211 212 s.update(text)
212 213 return s.digest()
213 214
214 class _testrevlog(object):
215 """minimalist fake revlog to use in doctests"""
216
217 def __init__(self, data, density=0.5, mingap=0):
218 """data is an list of revision payload boundaries"""
219 self._data = data
220 self._srdensitythreshold = density
221 self._srmingapsize = mingap
222
223 def start(self, rev):
224 if rev == 0:
225 return 0
226 return self._data[rev - 1]
227
228 def end(self, rev):
229 return self._data[rev]
230
231 def length(self, rev):
232 return self.end(rev) - self.start(rev)
233
234 def __len__(self):
235 return len(self._data)
236
237 def _trimchunk(revlog, revs, startidx, endidx=None):
238 """returns revs[startidx:endidx] without empty trailing revs
239
240 Doctest Setup
241 >>> revlog = _testrevlog([
242 ... 5, #0
243 ... 10, #1
244 ... 12, #2
245 ... 12, #3 (empty)
246 ... 17, #4
247 ... 21, #5
248 ... 21, #6 (empty)
249 ... ])
250
251 Contiguous cases:
252 >>> _trimchunk(revlog, [0, 1, 2, 3, 4, 5, 6], 0)
253 [0, 1, 2, 3, 4, 5]
254 >>> _trimchunk(revlog, [0, 1, 2, 3, 4, 5, 6], 0, 5)
255 [0, 1, 2, 3, 4]
256 >>> _trimchunk(revlog, [0, 1, 2, 3, 4, 5, 6], 0, 4)
257 [0, 1, 2]
258 >>> _trimchunk(revlog, [0, 1, 2, 3, 4, 5, 6], 2, 4)
259 [2]
260 >>> _trimchunk(revlog, [0, 1, 2, 3, 4, 5, 6], 3)
261 [3, 4, 5]
262 >>> _trimchunk(revlog, [0, 1, 2, 3, 4, 5, 6], 3, 5)
263 [3, 4]
264
265 Discontiguous cases:
266 >>> _trimchunk(revlog, [1, 3, 5, 6], 0)
267 [1, 3, 5]
268 >>> _trimchunk(revlog, [1, 3, 5, 6], 0, 2)
269 [1]
270 >>> _trimchunk(revlog, [1, 3, 5, 6], 1, 3)
271 [3, 5]
272 >>> _trimchunk(revlog, [1, 3, 5, 6], 1)
273 [3, 5]
274 """
275 length = revlog.length
276
277 if endidx is None:
278 endidx = len(revs)
279
280 # If we have a non-empty delta candidate, there is nothing to trim
281 if revs[endidx - 1] < len(revlog):
282 # Trim empty revs at the end, except the very first revision of a chain
283 while (endidx > 1
284 and endidx > startidx
285 and length(revs[endidx - 1]) == 0):
286 endidx -= 1
287
288 return revs[startidx:endidx]
289
290 def _segmentspan(revlog, revs, deltainfo=None):
291 """Get the byte span of a segment of revisions
292
293 revs is a sorted array of revision numbers
294
295 >>> revlog = _testrevlog([
296 ... 5, #0
297 ... 10, #1
298 ... 12, #2
299 ... 12, #3 (empty)
300 ... 17, #4
301 ... ])
302
303 >>> _segmentspan(revlog, [0, 1, 2, 3, 4])
304 17
305 >>> _segmentspan(revlog, [0, 4])
306 17
307 >>> _segmentspan(revlog, [3, 4])
308 5
309 >>> _segmentspan(revlog, [1, 2, 3,])
310 7
311 >>> _segmentspan(revlog, [1, 3])
312 7
313 """
314 if not revs:
315 return 0
316 if deltainfo is not None and len(revlog) <= revs[-1]:
317 if len(revs) == 1:
318 return deltainfo.deltalen
319 offset = revlog.end(len(revlog) - 1)
320 end = deltainfo.deltalen + offset
321 else:
322 end = revlog.end(revs[-1])
323 return end - revlog.start(revs[0])
324
325 def _slicechunk(revlog, revs, deltainfo=None, targetsize=None):
326 """slice revs to reduce the amount of unrelated data to be read from disk.
327
328 ``revs`` is sliced into groups that should be read in one go.
329 Assume that revs are sorted.
330
331 The initial chunk is sliced until the overall density (payload/chunks-span
332 ratio) is above `revlog._srdensitythreshold`. No gap smaller than
333 `revlog._srmingapsize` is skipped.
334
335 If `targetsize` is set, no chunk larger than `targetsize` will be yielded.
336 For consistency with other slicing choices, this limit won't go lower than
337 `revlog._srmingapsize`.
338 
339 If individual revision chunks are larger than this limit, they will still
340 be yielded individually.
341
342 >>> revlog = _testrevlog([
343 ... 5, #00 (5)
344 ... 10, #01 (5)
345 ... 12, #02 (2)
346 ... 12, #03 (empty)
347 ... 27, #04 (15)
348 ... 31, #05 (4)
349 ... 31, #06 (empty)
350 ... 42, #07 (11)
351 ... 47, #08 (5)
352 ... 47, #09 (empty)
353 ... 48, #10 (1)
354 ... 51, #11 (3)
355 ... 74, #12 (23)
356 ... 85, #13 (11)
357 ... 86, #14 (1)
358 ... 91, #15 (5)
359 ... ])
360
361 >>> list(_slicechunk(revlog, list(range(16))))
362 [[0, 1, 2, 3, 4, 5, 6, 7, 8, 9, 10, 11, 12, 13, 14, 15]]
363 >>> list(_slicechunk(revlog, [0, 15]))
364 [[0], [15]]
365 >>> list(_slicechunk(revlog, [0, 11, 15]))
366 [[0], [11], [15]]
367 >>> list(_slicechunk(revlog, [0, 11, 13, 15]))
368 [[0], [11, 13, 15]]
369 >>> list(_slicechunk(revlog, [1, 2, 3, 5, 8, 10, 11, 14]))
370 [[1, 2], [5, 8, 10, 11], [14]]
371
372 Slicing with a maximum chunk size
373 >>> list(_slicechunk(revlog, [0, 11, 13, 15], targetsize=15))
374 [[0], [11], [13], [15]]
375 >>> list(_slicechunk(revlog, [0, 11, 13, 15], targetsize=20))
376 [[0], [11], [13, 15]]
377 """
378 if targetsize is not None:
379 targetsize = max(targetsize, revlog._srmingapsize)
380 # targetsize should not be specified when evaluating delta candidates:
381 # * targetsize is used to ensure we stay within specification when reading,
382 # * deltainfo is used to pick a good delta chain when writing.
383 if not (deltainfo is None or targetsize is None):
384 msg = 'cannot use `targetsize` with a `deltainfo`'
385 raise error.ProgrammingError(msg)
386 for chunk in _slicechunktodensity(revlog, revs,
387 deltainfo,
388 revlog._srdensitythreshold,
389 revlog._srmingapsize):
390 for subchunk in _slicechunktosize(revlog, chunk, targetsize):
391 yield subchunk
392
393 def _slicechunktosize(revlog, revs, targetsize=None):
394 """slice revs to match the target size
395
396 This is intended to be used on chunks that density slicing selected but that
397 are still too large compared to the read guarantee of the revlog. This might
398 happen when the "minimal gap size" interrupted the slicing or when chains are
399 built in a way that creates large blocks next to each other.
400
401 >>> revlog = _testrevlog([
402 ... 3, #0 (3)
403 ... 5, #1 (2)
404 ... 6, #2 (1)
405 ... 8, #3 (2)
406 ... 8, #4 (empty)
407 ... 11, #5 (3)
408 ... 12, #6 (1)
409 ... 13, #7 (1)
410 ... 14, #8 (1)
411 ... ])
412
413 Cases where chunk is already small enough
414 >>> list(_slicechunktosize(revlog, [0], 3))
415 [[0]]
416 >>> list(_slicechunktosize(revlog, [6, 7], 3))
417 [[6, 7]]
418 >>> list(_slicechunktosize(revlog, [0], None))
419 [[0]]
420 >>> list(_slicechunktosize(revlog, [6, 7], None))
421 [[6, 7]]
422
423 Cases where we need actual slicing
424 >>> list(_slicechunktosize(revlog, [0, 1], 3))
425 [[0], [1]]
426 >>> list(_slicechunktosize(revlog, [1, 3], 3))
427 [[1], [3]]
428 >>> list(_slicechunktosize(revlog, [1, 2, 3], 3))
429 [[1, 2], [3]]
430 >>> list(_slicechunktosize(revlog, [3, 5], 3))
431 [[3], [5]]
432 >>> list(_slicechunktosize(revlog, [3, 4, 5], 3))
433 [[3], [5]]
434 >>> list(_slicechunktosize(revlog, [5, 6, 7, 8], 3))
435 [[5], [6, 7, 8]]
436 >>> list(_slicechunktosize(revlog, [0, 1, 2, 3, 4, 5, 6, 7, 8], 3))
437 [[0], [1, 2], [3], [5], [6, 7, 8]]
438
439 Case with too large individual chunk (must return valid chunk)
440 >>> list(_slicechunktosize(revlog, [0, 1], 2))
441 [[0], [1]]
442 >>> list(_slicechunktosize(revlog, [1, 3], 1))
443 [[1], [3]]
444 >>> list(_slicechunktosize(revlog, [3, 4, 5], 2))
445 [[3], [5]]
446 """
447 assert targetsize is None or 0 <= targetsize
448 if targetsize is None or _segmentspan(revlog, revs) <= targetsize:
449 yield revs
450 return
451
452 startrevidx = 0
453 startdata = revlog.start(revs[0])
454 endrevidx = 0
455 iterrevs = enumerate(revs)
456 next(iterrevs) # skip first rev.
457 for idx, r in iterrevs:
458 span = revlog.end(r) - startdata
459 if span <= targetsize:
460 endrevidx = idx
461 else:
462 chunk = _trimchunk(revlog, revs, startrevidx, endrevidx + 1)
463 if chunk:
464 yield chunk
465 startrevidx = idx
466 startdata = revlog.start(r)
467 endrevidx = idx
468 yield _trimchunk(revlog, revs, startrevidx)
469
470 def _slicechunktodensity(revlog, revs, deltainfo=None, targetdensity=0.5,
471 mingapsize=0):
472 """slice revs to reduce the amount of unrelated data to be read from disk.
473
474 ``revs`` is sliced into groups that should be read in one go.
475 Assume that revs are sorted.
476
477 ``deltainfo`` is a _deltainfo instance of a revision that we would append
478 to the top of the revlog.
479
480 The initial chunk is sliced until the overall density (payload/chunks-span
481 ratio) is above `targetdensity`. No gap smaller than `mingapsize` is
482 skipped.
483
484 >>> revlog = _testrevlog([
485 ... 5, #00 (5)
486 ... 10, #01 (5)
487 ... 12, #02 (2)
488 ... 12, #03 (empty)
489 ... 27, #04 (15)
490 ... 31, #05 (4)
491 ... 31, #06 (empty)
492 ... 42, #07 (11)
493 ... 47, #08 (5)
494 ... 47, #09 (empty)
495 ... 48, #10 (1)
496 ... 51, #11 (3)
497 ... 74, #12 (23)
498 ... 85, #13 (11)
499 ... 86, #14 (1)
500 ... 91, #15 (5)
501 ... ])
502
503 >>> list(_slicechunktodensity(revlog, list(range(16))))
504 [[0, 1, 2, 3, 4, 5, 6, 7, 8, 9, 10, 11, 12, 13, 14, 15]]
505 >>> list(_slicechunktodensity(revlog, [0, 15]))
506 [[0], [15]]
507 >>> list(_slicechunktodensity(revlog, [0, 11, 15]))
508 [[0], [11], [15]]
509 >>> list(_slicechunktodensity(revlog, [0, 11, 13, 15]))
510 [[0], [11, 13, 15]]
511 >>> list(_slicechunktodensity(revlog, [1, 2, 3, 5, 8, 10, 11, 14]))
512 [[1, 2], [5, 8, 10, 11], [14]]
513 >>> list(_slicechunktodensity(revlog, [1, 2, 3, 5, 8, 10, 11, 14],
514 ... mingapsize=20))
515 [[1, 2, 3, 5, 8, 10, 11], [14]]
516 >>> list(_slicechunktodensity(revlog, [1, 2, 3, 5, 8, 10, 11, 14],
517 ... targetdensity=0.95))
518 [[1, 2], [5], [8, 10, 11], [14]]
519 >>> list(_slicechunktodensity(revlog, [1, 2, 3, 5, 8, 10, 11, 14],
520 ... targetdensity=0.95, mingapsize=12))
521 [[1, 2], [5, 8, 10, 11], [14]]
522 """
523 start = revlog.start
524 length = revlog.length
525
526 if len(revs) <= 1:
527 yield revs
528 return
529
530 nextrev = len(revlog)
531 nextoffset = revlog.end(nextrev - 1)
532
533 if deltainfo is None:
534 deltachainspan = _segmentspan(revlog, revs)
535 chainpayload = sum(length(r) for r in revs)
536 else:
537 deltachainspan = deltainfo.distance
538 chainpayload = deltainfo.compresseddeltalen
539
540 if deltachainspan < mingapsize:
541 yield revs
542 return
543
544 readdata = deltachainspan
545
546 if deltachainspan:
547 density = chainpayload / float(deltachainspan)
548 else:
549 density = 1.0
550
551 if density >= targetdensity:
552 yield revs
553 return
554
555 if deltainfo is not None and deltainfo.deltalen:
556 revs = list(revs)
557 revs.append(nextrev)
558
559 # Store the gaps in a heap to have them sorted by decreasing size
560 gapsheap = []
561 heapq.heapify(gapsheap)
562 prevend = None
563 for i, rev in enumerate(revs):
564 if rev < nextrev:
565 revstart = start(rev)
566 revlen = length(rev)
567 else:
568 revstart = nextoffset
569 revlen = deltainfo.deltalen
570
571 # Skip empty revisions to form larger holes
572 if revlen == 0:
573 continue
574
575 if prevend is not None:
576 gapsize = revstart - prevend
577 # only consider holes that are large enough
578 if gapsize > mingapsize:
579 heapq.heappush(gapsheap, (-gapsize, i))
580
581 prevend = revstart + revlen
582
583 # Collect the indices of the largest holes until the density is acceptable
584 indicesheap = []
585 heapq.heapify(indicesheap)
586 while gapsheap and density < targetdensity:
587 oppgapsize, gapidx = heapq.heappop(gapsheap)
588
589 heapq.heappush(indicesheap, gapidx)
590
591 # the gap sizes are stored as negatives to be sorted decreasingly
592 # by the heap
593 readdata -= (-oppgapsize)
594 if readdata > 0:
595 density = chainpayload / float(readdata)
596 else:
597 density = 1.0
598
599 # Cut the revs at collected indices
600 previdx = 0
601 while indicesheap:
602 idx = heapq.heappop(indicesheap)
603
604 chunk = _trimchunk(revlog, revs, previdx, idx)
605 if chunk:
606 yield chunk
607
608 previdx = idx
609
610 chunk = _trimchunk(revlog, revs, previdx)
611 if chunk:
612 yield chunk
613
614 @attr.s(slots=True, frozen=True)
615 class _deltainfo(object):
616 distance = attr.ib()
617 deltalen = attr.ib()
618 data = attr.ib()
619 base = attr.ib()
620 chainbase = attr.ib()
621 chainlen = attr.ib()
622 compresseddeltalen = attr.ib()
623 snapshotdepth = attr.ib()
624
625 class _deltacomputer(object):
626 def __init__(self, revlog):
627 self.revlog = revlog
628
629 def _getcandidaterevs(self, p1, p2, cachedelta):
630 """
631 Provides revisions that present an interest to be diffed against,
632 grouped by level of easiness.
633 """
634 revlog = self.revlog
635 gdelta = revlog._generaldelta
636 curr = len(revlog)
637 prev = curr - 1
638 p1r, p2r = revlog.rev(p1), revlog.rev(p2)
639
640 # should we try to build a delta?
641 if prev != nullrev and revlog._storedeltachains:
642 tested = set()
643 # This condition is true most of the time when processing
644 # changegroup data into a generaldelta repo. The only time it
645 # isn't true is if this is the first revision in a delta chain
646 # or if ``format.generaldelta=true`` disabled ``lazydeltabase``.
647 if cachedelta and gdelta and revlog._lazydeltabase:
648 # Assume what we received from the server is a good choice;
649 # building the delta will reuse the cache
650 yield (cachedelta[0],)
651 tested.add(cachedelta[0])
652
653 if gdelta:
654 # exclude already lazy tested base if any
655 parents = [p for p in (p1r, p2r)
656 if p != nullrev and p not in tested]
657
658 if not revlog._deltabothparents and len(parents) == 2:
659 parents.sort()
660 # To minimize the chance of having to build a fulltext,
661 # pick first whichever parent is closest to us (max rev)
662 yield (parents[1],)
663 # then the other one (min rev) if the first did not fit
664 yield (parents[0],)
665 tested.update(parents)
666 elif len(parents) > 0:
667 # Test all parents (1 or 2), and keep the best candidate
668 yield parents
669 tested.update(parents)
670
671 if prev not in tested:
672 # other approaches failed; try against prev to hopefully save us a
673 # fulltext.
674 yield (prev,)
675 tested.add(prev)
676
677 def buildtext(self, revinfo, fh):
678 """Builds a fulltext version of a revision
679
680 revinfo: _revisioninfo instance that contains all needed info
681 fh: file handle to either the .i or the .d revlog file,
682 depending on whether it is inlined or not
683 """
684 btext = revinfo.btext
685 if btext[0] is not None:
686 return btext[0]
687
688 revlog = self.revlog
689 cachedelta = revinfo.cachedelta
690 flags = revinfo.flags
691 node = revinfo.node
692
693 baserev = cachedelta[0]
694 delta = cachedelta[1]
695 # special case deltas which replace entire base; no need to decode
696 # base revision. this neatly avoids censored bases, which throw when
697 # they're decoded.
698 hlen = struct.calcsize(">lll")
699 if delta[:hlen] == mdiff.replacediffheader(revlog.rawsize(baserev),
700 len(delta) - hlen):
701 btext[0] = delta[hlen:]
702 else:
703 # deltabase is rawtext before changed by flag processors, which is
704 # equivalent to non-raw text
705 basetext = revlog.revision(baserev, _df=fh, raw=False)
706 btext[0] = mdiff.patch(basetext, delta)
707
708 try:
709 res = revlog._processflags(btext[0], flags, 'read', raw=True)
710 btext[0], validatehash = res
711 if validatehash:
712 revlog.checkhash(btext[0], node, p1=revinfo.p1, p2=revinfo.p2)
713 if flags & REVIDX_ISCENSORED:
714 raise RevlogError(_('node %s is not censored') % node)
715 except CensoredNodeError:
716 # must pass the censored index flag to add censored revisions
717 if not flags & REVIDX_ISCENSORED:
718 raise
719 return btext[0]
720
721 def _builddeltadiff(self, base, revinfo, fh):
722 revlog = self.revlog
723 t = self.buildtext(revinfo, fh)
724 if revlog.iscensored(base):
725 # deltas based on a censored revision must replace the
726 # full content in one patch, so delta works everywhere
727 header = mdiff.replacediffheader(revlog.rawsize(base), len(t))
728 delta = header + t
729 else:
730 ptext = revlog.revision(base, _df=fh, raw=True)
731 delta = mdiff.textdiff(ptext, t)
732
733 return delta
734
735 def _builddeltainfo(self, revinfo, base, fh):
736 # can we use the cached delta?
737 if revinfo.cachedelta and revinfo.cachedelta[0] == base:
738 delta = revinfo.cachedelta[1]
739 else:
740 delta = self._builddeltadiff(base, revinfo, fh)
741 revlog = self.revlog
742 header, data = revlog.compress(delta)
743 deltalen = len(header) + len(data)
744 chainbase = revlog.chainbase(base)
745 offset = revlog.end(len(revlog) - 1)
746 dist = deltalen + offset - revlog.start(chainbase)
747 if revlog._generaldelta:
748 deltabase = base
749 else:
750 deltabase = chainbase
751 chainlen, compresseddeltalen = revlog._chaininfo(base)
752 chainlen += 1
753 compresseddeltalen += deltalen
754
755 revlog = self.revlog
756 snapshotdepth = None
757 if deltabase == nullrev:
758 snapshotdepth = 0
759 elif revlog._sparserevlog and revlog.issnapshot(deltabase):
760 # A delta chain should always be one full snapshot,
761 # zero or more semi-snapshots, and zero or more deltas
762 p1, p2 = revlog.rev(revinfo.p1), revlog.rev(revinfo.p2)
763 if deltabase not in (p1, p2) and revlog.issnapshot(deltabase):
764 snapshotdepth = len(revlog._deltachain(deltabase)[0])
765
766 return _deltainfo(dist, deltalen, (header, data), deltabase,
767 chainbase, chainlen, compresseddeltalen,
768 snapshotdepth)
769
770 def finddeltainfo(self, revinfo, fh):
771 """Find an acceptable delta against a candidate revision
772
773 revinfo: information about the revision (instance of _revisioninfo)
774 fh: file handle to either the .i or the .d revlog file,
775 depending on whether it is inlined or not
776
777 Returns the first acceptable candidate revision, as ordered by
778 _getcandidaterevs
779 """
780 if not revinfo.textlen:
781 return None # empty files do not need a delta
782
783 cachedelta = revinfo.cachedelta
784 p1 = revinfo.p1
785 p2 = revinfo.p2
786 revlog = self.revlog
787
788 deltalength = self.revlog.length
789 deltaparent = self.revlog.deltaparent
790
791 deltainfo = None
792 deltas_limit = revinfo.textlen * LIMIT_DELTA2TEXT
793 for candidaterevs in self._getcandidaterevs(p1, p2, cachedelta):
794 # filter out delta bases that will never produce a good delta
795 candidaterevs = [r for r in candidaterevs
796 if self.revlog.length(r) <= deltas_limit]
797 nominateddeltas = []
798 for candidaterev in candidaterevs:
799 # skip over empty delta (no need to include them in a chain)
800 while candidaterev != nullrev and not deltalength(candidaterev):
801 candidaterev = deltaparent(candidaterev)
802 # no need to try a delta against nullid, this will be handled
803 # by fulltext later.
804 if candidaterev == nullrev:
805 continue
806 # no delta for rawtext-changing revs (see "candelta" for why)
807 if revlog.flags(candidaterev) & REVIDX_RAWTEXT_CHANGING_FLAGS:
808 continue
809 candidatedelta = self._builddeltainfo(revinfo, candidaterev, fh)
810 if revlog._isgooddeltainfo(candidatedelta, revinfo):
811 nominateddeltas.append(candidatedelta)
812 if nominateddeltas:
813 deltainfo = min(nominateddeltas, key=lambda x: x.deltalen)
814 break
815
816 return deltainfo
817
818 215 @attr.s(slots=True, frozen=True)
819 216 class _revisioninfo(object):
820 217 """Information about a revision that allows building its fulltext
821 218 node: expected hash of the revision
822 219 p1, p2: parent revs of the revision
823 220 btext: built text cache consisting of a one-element list
824 221 cachedelta: (baserev, uncompressed_delta) or None
825 222 flags: flags associated to the revision storage
826 223
827 224 One of btext[0] or cachedelta must be set.
828 225 """
829 226 node = attr.ib()
830 227 p1 = attr.ib()
831 228 p2 = attr.ib()
832 229 btext = attr.ib()
833 230 textlen = attr.ib()
834 231 cachedelta = attr.ib()
835 232 flags = attr.ib()
836 233
837 234 @interfaceutil.implementer(repository.irevisiondelta)
838 235 @attr.s(slots=True, frozen=True)
839 236 class revlogrevisiondelta(object):
840 237 node = attr.ib()
841 238 p1node = attr.ib()
842 239 p2node = attr.ib()
843 240 basenode = attr.ib()
844 241 linknode = attr.ib()
845 242 flags = attr.ib()
846 243 baserevisionsize = attr.ib()
847 244 revision = attr.ib()
848 245 delta = attr.ib()
849 246
850 247 # index v0:
851 248 # 4 bytes: offset
852 249 # 4 bytes: compressed length
853 250 # 4 bytes: base rev
854 251 # 4 bytes: link rev
855 252 # 20 bytes: parent 1 nodeid
856 253 # 20 bytes: parent 2 nodeid
857 254 # 20 bytes: nodeid
858 255 indexformatv0 = struct.Struct(">4l20s20s20s")
859 256 indexformatv0_pack = indexformatv0.pack
860 257 indexformatv0_unpack = indexformatv0.unpack
861 258
862 259 class revlogoldindex(list):
863 260 def __getitem__(self, i):
864 261 if i == -1:
865 262 return (0, 0, 0, -1, -1, -1, -1, nullid)
866 263 return list.__getitem__(self, i)
867 264
868 265 class revlogoldio(object):
869 266 def __init__(self):
870 267 self.size = indexformatv0.size
871 268
872 269 def parseindex(self, data, inline):
873 270 s = self.size
874 271 index = []
875 272 nodemap = {nullid: nullrev}
876 273 n = off = 0
877 274 l = len(data)
878 275 while off + s <= l:
879 276 cur = data[off:off + s]
880 277 off += s
881 278 e = indexformatv0_unpack(cur)
882 279 # transform to revlogv1 format
883 280 e2 = (offset_type(e[0], 0), e[1], -1, e[2], e[3],
884 281 nodemap.get(e[4], nullrev), nodemap.get(e[5], nullrev), e[6])
885 282 index.append(e2)
886 283 nodemap[e[6]] = n
887 284 n += 1
888 285
889 286 return revlogoldindex(index), nodemap, None
890 287
891 288 def packentry(self, entry, node, version, rev):
892 289 if gettype(entry[0]):
893 290 raise RevlogError(_('index entry flags need revlog version 1'))
894 291 e2 = (getoffset(entry[0]), entry[1], entry[3], entry[4],
895 292 node(entry[5]), node(entry[6]), entry[7])
896 293 return indexformatv0_pack(*e2)
897 294
898 295 # index ng:
899 296 # 6 bytes: offset
900 297 # 2 bytes: flags
901 298 # 4 bytes: compressed length
902 299 # 4 bytes: uncompressed length
903 300 # 4 bytes: base rev
904 301 # 4 bytes: link rev
905 302 # 4 bytes: parent 1 rev
906 303 # 4 bytes: parent 2 rev
907 304 # 32 bytes: nodeid
908 305 indexformatng = struct.Struct(">Qiiiiii20s12x")
909 306 indexformatng_pack = indexformatng.pack
910 307 versionformat = struct.Struct(">I")
911 308 versionformat_pack = versionformat.pack
912 309 versionformat_unpack = versionformat.unpack
913 310
914 311 # corresponds to uncompressed length of indexformatng (2 gigs, 4-byte
915 312 # signed integer)
916 313 _maxentrysize = 0x7fffffff
917 314
918 315 class revlogio(object):
919 316 def __init__(self):
920 317 self.size = indexformatng.size
921 318
922 319 def parseindex(self, data, inline):
923 320 # call the C implementation to parse the index data
924 321 index, cache = parsers.parse_index2(data, inline)
925 322 return index, getattr(index, 'nodemap', None), cache
926 323
927 324 def packentry(self, entry, node, version, rev):
928 325 p = indexformatng_pack(*entry)
929 326 if rev == 0:
930 327 p = versionformat_pack(version) + p[4:]
931 328 return p
932 329
933 330 class revlog(object):
934 331 """
935 332 the underlying revision storage object
936 333
937 334 A revlog consists of two parts, an index and the revision data.
938 335
939 336 The index is a file with a fixed record size containing
940 337 information on each revision, including its nodeid (hash), the
941 338 nodeids of its parents, the position and offset of its data within
942 339 the data file, and the revision it's based on. Finally, each entry
943 340 contains a linkrev entry that can serve as a pointer to external
944 341 data.
945 342
946 343 The revision data itself is a linear collection of data chunks.
947 344 Each chunk represents a revision and is usually represented as a
948 345 delta against the previous chunk. To bound lookup time, runs of
949 346 deltas are limited to about 2 times the length of the original
950 347 version data. This makes retrieval of a version proportional to
951 348 its size, or O(1) relative to the number of revisions.
952 349
953 350 Both pieces of the revlog are written to in an append-only
954 351 fashion, which means we never need to rewrite a file to insert or
955 352 remove data, and can use some simple techniques to avoid the need
956 353 for locking while reading.
957 354
958 355 If checkambig, indexfile is opened with checkambig=True at
959 356 writing, to avoid file stat ambiguity.
960 357
961 358 If mmaplargeindex is True, and an mmapindexthreshold is set, the
962 359 index will be mmapped rather than read if it is larger than the
963 360 configured threshold.
964 361
965 362 If censorable is True, the revlog can have censored revisions.
966 363 """
967 364 def __init__(self, opener, indexfile, datafile=None, checkambig=False,
968 365 mmaplargeindex=False, censorable=False):
969 366 """
970 367 create a revlog object
971 368
972 369 opener is a function that abstracts the file opening operation
973 370 and can be used to implement COW semantics or the like.
974 371 """
975 372 self.indexfile = indexfile
976 373 self.datafile = datafile or (indexfile[:-2] + ".d")
977 374 self.opener = opener
978 375 # When True, indexfile is opened with checkambig=True at writing, to
979 376 # avoid file stat ambiguity.
980 377 self._checkambig = checkambig
981 378 self._censorable = censorable
982 379 # 3-tuple of (node, rev, text) for a raw revision.
983 380 self._cache = None
984 381 # Maps rev to chain base rev.
985 382 self._chainbasecache = util.lrucachedict(100)
986 383 # 2-tuple of (offset, data) of raw data from the revlog at an offset.
987 384 self._chunkcache = (0, '')
988 385 # How much data to read and cache into the raw revlog data cache.
989 386 self._chunkcachesize = 65536
990 387 self._maxchainlen = None
991 388 self._deltabothparents = True
992 389 self.index = []
993 390 # Mapping of partial identifiers to full nodes.
994 391 self._pcache = {}
995 392 # Mapping of revision integer to full node.
996 393 self._nodecache = {nullid: nullrev}
997 394 self._nodepos = None
998 395 self._compengine = 'zlib'
999 396 self._maxdeltachainspan = -1
1000 397 self._withsparseread = False
1001 398 self._sparserevlog = False
1002 399 self._srdensitythreshold = 0.50
1003 400 self._srmingapsize = 262144
1004 401
1005 402 mmapindexthreshold = None
1006 403 v = REVLOG_DEFAULT_VERSION
1007 404 opts = getattr(opener, 'options', None)
1008 405 if opts is not None:
1009 406 if 'revlogv2' in opts:
1010 407 # version 2 revlogs always use generaldelta.
1011 408 v = REVLOGV2 | FLAG_GENERALDELTA | FLAG_INLINE_DATA
1012 409 elif 'revlogv1' in opts:
1013 410 if 'generaldelta' in opts:
1014 411 v |= FLAG_GENERALDELTA
1015 412 else:
1016 413 v = 0
1017 414 if 'chunkcachesize' in opts:
1018 415 self._chunkcachesize = opts['chunkcachesize']
1019 416 if 'maxchainlen' in opts:
1020 417 self._maxchainlen = opts['maxchainlen']
1021 418 if 'deltabothparents' in opts:
1022 419 self._deltabothparents = opts['deltabothparents']
1023 420 self._lazydeltabase = bool(opts.get('lazydeltabase', False))
1024 421 if 'compengine' in opts:
1025 422 self._compengine = opts['compengine']
1026 423 if 'maxdeltachainspan' in opts:
1027 424 self._maxdeltachainspan = opts['maxdeltachainspan']
1028 425 if mmaplargeindex and 'mmapindexthreshold' in opts:
1029 426 mmapindexthreshold = opts['mmapindexthreshold']
1030 427 self._sparserevlog = bool(opts.get('sparse-revlog', False))
1031 428 withsparseread = bool(opts.get('with-sparse-read', False))
1032 429 # sparse-revlog forces sparse-read
1033 430 self._withsparseread = self._sparserevlog or withsparseread
1034 431 if 'sparse-read-density-threshold' in opts:
1035 432 self._srdensitythreshold = opts['sparse-read-density-threshold']
1036 433 if 'sparse-read-min-gap-size' in opts:
1037 434 self._srmingapsize = opts['sparse-read-min-gap-size']
1038 435
1039 436 if self._chunkcachesize <= 0:
1040 437 raise RevlogError(_('revlog chunk cache size %r is not greater '
1041 438 'than 0') % self._chunkcachesize)
1042 439 elif self._chunkcachesize & (self._chunkcachesize - 1):
1043 440 raise RevlogError(_('revlog chunk cache size %r is not a power '
1044 441 'of 2') % self._chunkcachesize)
1045 442
1046 443 indexdata = ''
1047 444 self._initempty = True
1048 445 try:
1049 446 with self._indexfp() as f:
1050 447 if (mmapindexthreshold is not None and
1051 448 self.opener.fstat(f).st_size >= mmapindexthreshold):
1052 449 indexdata = util.buffer(util.mmapread(f))
1053 450 else:
1054 451 indexdata = f.read()
1055 452 if len(indexdata) > 0:
1056 453 v = versionformat_unpack(indexdata[:4])[0]
1057 454 self._initempty = False
1058 455 except IOError as inst:
1059 456 if inst.errno != errno.ENOENT:
1060 457 raise
1061 458
1062 459 self.version = v
1063 460 self._inline = v & FLAG_INLINE_DATA
1064 461 self._generaldelta = v & FLAG_GENERALDELTA
1065 462 flags = v & ~0xFFFF
1066 463 fmt = v & 0xFFFF
1067 464 if fmt == REVLOGV0:
1068 465 if flags:
1069 466 raise RevlogError(_('unknown flags (%#04x) in version %d '
1070 467 'revlog %s') %
1071 468 (flags >> 16, fmt, self.indexfile))
1072 469 elif fmt == REVLOGV1:
1073 470 if flags & ~REVLOGV1_FLAGS:
1074 471 raise RevlogError(_('unknown flags (%#04x) in version %d '
1075 472 'revlog %s') %
1076 473 (flags >> 16, fmt, self.indexfile))
1077 474 elif fmt == REVLOGV2:
1078 475 if flags & ~REVLOGV2_FLAGS:
1079 476 raise RevlogError(_('unknown flags (%#04x) in version %d '
1080 477 'revlog %s') %
1081 478 (flags >> 16, fmt, self.indexfile))
1082 479 else:
1083 480 raise RevlogError(_('unknown version (%d) in revlog %s') %
1084 481 (fmt, self.indexfile))
1085 482
1086 483 self._storedeltachains = True
1087 484
1088 485 self._io = revlogio()
1089 486 if self.version == REVLOGV0:
1090 487 self._io = revlogoldio()
1091 488 try:
1092 489 d = self._io.parseindex(indexdata, self._inline)
1093 490 except (ValueError, IndexError):
1094 491 raise RevlogError(_("index %s is corrupted") % (self.indexfile))
1095 492 self.index, nodemap, self._chunkcache = d
1096 493 if nodemap is not None:
1097 494 self.nodemap = self._nodecache = nodemap
1098 495 if not self._chunkcache:
1099 496 self._chunkclear()
1100 497 # revnum -> (chain-length, sum-delta-length)
1101 498 self._chaininfocache = {}
1102 499 # revlog header -> revlog compressor
1103 500 self._decompressors = {}
1104 501
1105 502 @util.propertycache
1106 503 def _compressor(self):
1107 504 return util.compengines[self._compengine].revlogcompressor()
1108 505
1109 506 def _indexfp(self, mode='r'):
1110 507 """file object for the revlog's index file"""
1111 508 args = {r'mode': mode}
1112 509 if mode != 'r':
1113 510 args[r'checkambig'] = self._checkambig
1114 511 if mode == 'w':
1115 512 args[r'atomictemp'] = True
1116 513 return self.opener(self.indexfile, **args)
1117 514
1118 515 def _datafp(self, mode='r'):
1119 516 """file object for the revlog's data file"""
1120 517 return self.opener(self.datafile, mode=mode)
1121 518
1122 519 @contextlib.contextmanager
1123 520 def _datareadfp(self, existingfp=None):
1124 521 """file object suitable to read data"""
1125 522 if existingfp is not None:
1126 523 yield existingfp
1127 524 else:
1128 525 if self._inline:
1129 526 func = self._indexfp
1130 527 else:
1131 528 func = self._datafp
1132 529 with func() as fp:
1133 530 yield fp
1134 531
1135 532 def tip(self):
1136 533 return self.node(len(self.index) - 1)
1137 534 def __contains__(self, rev):
1138 535 return 0 <= rev < len(self)
1139 536 def __len__(self):
1140 537 return len(self.index)
1141 538 def __iter__(self):
1142 539 return iter(pycompat.xrange(len(self)))
1143 540 def revs(self, start=0, stop=None):
1144 541 """iterate over all rev in this revlog (from start to stop)"""
1145 542 step = 1
1146 543 length = len(self)
1147 544 if stop is not None:
1148 545 if start > stop:
1149 546 step = -1
1150 547 stop += step
1151 548 if stop > length:
1152 549 stop = length
1153 550 else:
1154 551 stop = length
1155 552 return pycompat.xrange(start, stop, step)
1156 553
1157 554 @util.propertycache
1158 555 def nodemap(self):
1159 556 if self.index:
1160 557 # populate mapping down to the initial node
1161 558 node0 = self.index[0][7] # get around changelog filtering
1162 559 self.rev(node0)
1163 560 return self._nodecache
1164 561
1165 562 def hasnode(self, node):
1166 563 try:
1167 564 self.rev(node)
1168 565 return True
1169 566 except KeyError:
1170 567 return False
1171 568
1172 569 def candelta(self, baserev, rev):
1173 570 """whether two revisions (baserev, rev) can be delta-ed or not"""
1174 571 # Disable delta if either rev requires a content-changing flag
1175 572 # processor (ex. LFS). This is because such flag processor can alter
1176 573 # the rawtext content that the delta will be based on, and two clients
1177 574 # could have the same revlog node with different flags (i.e. different
1178 575 # rawtext contents) and the delta could be incompatible.
1179 576 if ((self.flags(baserev) & REVIDX_RAWTEXT_CHANGING_FLAGS)
1180 577 or (self.flags(rev) & REVIDX_RAWTEXT_CHANGING_FLAGS)):
1181 578 return False
1182 579 return True
1183 580
1184 581 def clearcaches(self):
1185 582 self._cache = None
1186 583 self._chainbasecache.clear()
1187 584 self._chunkcache = (0, '')
1188 585 self._pcache = {}
1189 586
1190 587 try:
1191 588 self._nodecache.clearcaches()
1192 589 except AttributeError:
1193 590 self._nodecache = {nullid: nullrev}
1194 591 self._nodepos = None
1195 592
1196 593 def rev(self, node):
1197 594 try:
1198 595 return self._nodecache[node]
1199 596 except TypeError:
1200 597 raise
1201 598 except RevlogError:
1202 599 # parsers.c radix tree lookup failed
1203 600 if node == wdirid or node in wdirfilenodeids:
1204 601 raise error.WdirUnsupported
1205 602 raise LookupError(node, self.indexfile, _('no node'))
1206 603 except KeyError:
1207 604 # pure python cache lookup failed
1208 605 n = self._nodecache
1209 606 i = self.index
1210 607 p = self._nodepos
1211 608 if p is None:
1212 609 p = len(i) - 1
1213 610 else:
1214 611 assert p < len(i)
1215 612 for r in pycompat.xrange(p, -1, -1):
1216 613 v = i[r][7]
1217 614 n[v] = r
1218 615 if v == node:
1219 616 self._nodepos = r - 1
1220 617 return r
1221 618 if node == wdirid or node in wdirfilenodeids:
1222 619 raise error.WdirUnsupported
1223 620 raise LookupError(node, self.indexfile, _('no node'))
1224 621
1225 622 # Accessors for index entries.
1226 623
1227 624 # First tuple entry is 8 bytes. First 6 bytes are offset. Last 2 bytes
1228 625 # are flags.
1229 626 def start(self, rev):
1230 627 return int(self.index[rev][0] >> 16)
1231 628
1232 629 def flags(self, rev):
1233 630 return self.index[rev][0] & 0xFFFF
1234 631
1235 632 def length(self, rev):
1236 633 return self.index[rev][1]
1237 634
1238 635 def rawsize(self, rev):
1239 636 """return the length of the uncompressed text for a given revision"""
1240 637 l = self.index[rev][2]
1241 638 if l >= 0:
1242 639 return l
1243 640
1244 641 t = self.revision(rev, raw=True)
1245 642 return len(t)
1246 643
1247 644 def size(self, rev):
1248 645 """length of non-raw text (processed by a "read" flag processor)"""
1249 646 # fast path: if no "read" flag processor could change the content,
1250 647 # size is rawsize. note: ELLIPSIS is known to not change the content.
1251 648 flags = self.flags(rev)
1252 649 if flags & (REVIDX_KNOWN_FLAGS ^ REVIDX_ELLIPSIS) == 0:
1253 650 return self.rawsize(rev)
1254 651
1255 652 return len(self.revision(rev, raw=False))
1256 653
1257 654 def chainbase(self, rev):
1258 655 base = self._chainbasecache.get(rev)
1259 656 if base is not None:
1260 657 return base
1261 658
1262 659 index = self.index
1263 660 iterrev = rev
1264 661 base = index[iterrev][3]
1265 662 while base != iterrev:
1266 663 iterrev = base
1267 664 base = index[iterrev][3]
1268 665
1269 666 self._chainbasecache[rev] = base
1270 667 return base
1271 668
1272 669 def linkrev(self, rev):
1273 670 return self.index[rev][4]
1274 671
1275 672 def parentrevs(self, rev):
1276 673 try:
1277 674 entry = self.index[rev]
1278 675 except IndexError:
1279 676 if rev == wdirrev:
1280 677 raise error.WdirUnsupported
1281 678 raise
1282 679
1283 680 return entry[5], entry[6]
1284 681
1285 682 def node(self, rev):
1286 683 try:
1287 684 return self.index[rev][7]
1288 685 except IndexError:
1289 686 if rev == wdirrev:
1290 687 raise error.WdirUnsupported
1291 688 raise
1292 689
1293 690 # Derived from index values.
1294 691
1295 692 def end(self, rev):
1296 693 return self.start(rev) + self.length(rev)
1297 694
1298 695 def parents(self, node):
1299 696 i = self.index
1300 697 d = i[self.rev(node)]
1301 698 return i[d[5]][7], i[d[6]][7] # map revisions to nodes inline
1302 699
1303 700 def chainlen(self, rev):
1304 701 return self._chaininfo(rev)[0]
1305 702
1306 703 def _chaininfo(self, rev):
1307 704 chaininfocache = self._chaininfocache
1308 705 if rev in chaininfocache:
1309 706 return chaininfocache[rev]
1310 707 index = self.index
1311 708 generaldelta = self._generaldelta
1312 709 iterrev = rev
1313 710 e = index[iterrev]
1314 711 clen = 0
1315 712 compresseddeltalen = 0
1316 713 while iterrev != e[3]:
1317 714 clen += 1
1318 715 compresseddeltalen += e[1]
1319 716 if generaldelta:
1320 717 iterrev = e[3]
1321 718 else:
1322 719 iterrev -= 1
1323 720 if iterrev in chaininfocache:
1324 721 t = chaininfocache[iterrev]
1325 722 clen += t[0]
1326 723 compresseddeltalen += t[1]
1327 724 break
1328 725 e = index[iterrev]
1329 726 else:
1330 727 # Add text length of base since decompressing that also takes
1331 728 # work. For cache hits the length is already included.
1332 729 compresseddeltalen += e[1]
1333 730 r = (clen, compresseddeltalen)
1334 731 chaininfocache[rev] = r
1335 732 return r
1336 733
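A hedged sketch relating the two chain helpers; `rl` and `rev` are assumed:

# chainlen() is the public wrapper; _chaininfo() additionally reports how
# many compressed delta bytes a reconstruction would have to decompress
clen, compresseddeltalen = rl._chaininfo(rev)
assert clen == rl.chainlen(rev)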
1337 734 def _deltachain(self, rev, stoprev=None):
1338 735 """Obtain the delta chain for a revision.
1339 736
1340 737 ``stoprev`` specifies a revision to stop at. If not specified, we
1341 738 stop at the base of the chain.
1342 739
1343 740 Returns a 2-tuple of (chain, stopped) where ``chain`` is a list of
1344 741 revs in ascending order and ``stopped`` is a bool indicating whether
1345 742 ``stoprev`` was hit.
1346 743 """
1347 744 # Try C implementation.
1348 745 try:
1349 746 return self.index.deltachain(rev, stoprev, self._generaldelta)
1350 747 except AttributeError:
1351 748 pass
1352 749
1353 750 chain = []
1354 751
1355 752 # Alias to prevent attribute lookup in tight loop.
1356 753 index = self.index
1357 754 generaldelta = self._generaldelta
1358 755
1359 756 iterrev = rev
1360 757 e = index[iterrev]
1361 758 while iterrev != e[3] and iterrev != stoprev:
1362 759 chain.append(iterrev)
1363 760 if generaldelta:
1364 761 iterrev = e[3]
1365 762 else:
1366 763 iterrev -= 1
1367 764 e = index[iterrev]
1368 765
1369 766 if iterrev == stoprev:
1370 767 stopped = True
1371 768 else:
1372 769 chain.append(iterrev)
1373 770 stopped = False
1374 771
1375 772 chain.reverse()
1376 773 return chain, stopped
1377 774
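A usage sketch of the chain walk above, with `rl` and `rev` assumed:

chain, stopped = rl._deltachain(rev)
# the chain is returned in ascending order and ends at `rev`; without a
# stoprev the walk always reaches the chain base, so `stopped` is False
assert chain[-1] == rev and not stopped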
1378 775 def ancestors(self, revs, stoprev=0, inclusive=False):
1379 776 """Generate the ancestors of 'revs' in reverse topological order.
1380 777 Does not generate revs lower than stoprev.
1381 778
1382 779 See the documentation for ancestor.lazyancestors for more details."""
1383 780
1384 781 return ancestor.lazyancestors(self.parentrevs, revs, stoprev=stoprev,
1385 782 inclusive=inclusive)
1386 783
1387 784 def descendants(self, revs):
1388 785 """Generate the descendants of 'revs' in revision order.
1389 786
1390 787 Yield a sequence of revision numbers starting with a child of
1391 788 some rev in revs, i.e., each revision is *not* considered a
1392 789 descendant of itself. Results are ordered by revision number (a
1393 790 topological sort)."""
1394 791 first = min(revs)
1395 792 if first == nullrev:
1396 793 for i in self:
1397 794 yield i
1398 795 return
1399 796
1400 797 seen = set(revs)
1401 798 for i in self.revs(start=first + 1):
1402 799 for x in self.parentrevs(i):
1403 800 if x != nullrev and x in seen:
1404 801 seen.add(i)
1405 802 yield i
1406 803 break
1407 804
1408 805 def findcommonmissing(self, common=None, heads=None):
1409 806 """Return a tuple of the ancestors of common and the ancestors of heads
1410 807 that are not ancestors of common. In revset terminology, we return the
1411 808 tuple:
1412 809
1413 810 ::common, (::heads) - (::common)
1414 811
1415 812 The list is sorted by revision number, meaning it is
1416 813 topologically sorted.
1417 814
1418 815 'heads' and 'common' are both lists of node IDs. If heads is
1419 816 not supplied, uses all of the revlog's heads. If common is not
1420 817 supplied, uses nullid."""
1421 818 if common is None:
1422 819 common = [nullid]
1423 820 if heads is None:
1424 821 heads = self.heads()
1425 822
1426 823 common = [self.rev(n) for n in common]
1427 824 heads = [self.rev(n) for n in heads]
1428 825
1429 826 # we want the ancestors, but inclusive
1430 827 class lazyset(object):
1431 828 def __init__(self, lazyvalues):
1432 829 self.addedvalues = set()
1433 830 self.lazyvalues = lazyvalues
1434 831
1435 832 def __contains__(self, value):
1436 833 return value in self.addedvalues or value in self.lazyvalues
1437 834
1438 835 def __iter__(self):
1439 836 added = self.addedvalues
1440 837 for r in added:
1441 838 yield r
1442 839 for r in self.lazyvalues:
1443 840 if r not in added:
1444 841 yield r
1445 842
1446 843 def add(self, value):
1447 844 self.addedvalues.add(value)
1448 845
1449 846 def update(self, values):
1450 847 self.addedvalues.update(values)
1451 848
1452 849 has = lazyset(self.ancestors(common))
1453 850 has.add(nullrev)
1454 851 has.update(common)
1455 852
1456 853 # take all ancestors from heads that aren't in has
1457 854 missing = set()
1458 855 visit = collections.deque(r for r in heads if r not in has)
1459 856 while visit:
1460 857 r = visit.popleft()
1461 858 if r in missing:
1462 859 continue
1463 860 else:
1464 861 missing.add(r)
1465 862 for p in self.parentrevs(r):
1466 863 if p not in has:
1467 864 visit.append(p)
1468 865 missing = list(missing)
1469 866 missing.sort()
1470 867 return has, [self.node(miss) for miss in missing]
1471 868
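A hedged call sketch; `rl` is an assumed revlog and `commonnode`/`headnode` are hypothetical node ids:

has, missing = rl.findcommonmissing(common=[commonnode], heads=[headnode])
# `has` answers ancestors-of-common membership lazily; `missing` is the
# topologically sorted node list for (::heads) - (::common)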
1472 869 def incrementalmissingrevs(self, common=None):
1473 870 """Return an object that can be used to incrementally compute the
1474 871 revision numbers of the ancestors of arbitrary sets that are not
1475 872 ancestors of common. This is an ancestor.incrementalmissingancestors
1476 873 object.
1477 874
1478 875 'common' is a list of revision numbers. If common is not supplied, uses
1479 876 nullrev.
1480 877 """
1481 878 if common is None:
1482 879 common = [nullrev]
1483 880
1484 881 return ancestor.incrementalmissingancestors(self.parentrevs, common)
1485 882
1486 883 def findmissingrevs(self, common=None, heads=None):
1487 884 """Return the revision numbers of the ancestors of heads that
1488 885 are not ancestors of common.
1489 886
1490 887 More specifically, return a list of revision numbers corresponding to
1491 888 nodes N such that every N satisfies the following constraints:
1492 889
1493 890 1. N is an ancestor of some node in 'heads'
1494 891 2. N is not an ancestor of any node in 'common'
1495 892
1496 893 The list is sorted by revision number, meaning it is
1497 894 topologically sorted.
1498 895
1499 896 'heads' and 'common' are both lists of revision numbers. If heads is
1500 897 not supplied, uses all of the revlog's heads. If common is not
1501 898 supplied, uses nullid."""
1502 899 if common is None:
1503 900 common = [nullrev]
1504 901 if heads is None:
1505 902 heads = self.headrevs()
1506 903
1507 904 inc = self.incrementalmissingrevs(common=common)
1508 905 return inc.missingancestors(heads)
1509 906
1510 907 def findmissing(self, common=None, heads=None):
1511 908 """Return the ancestors of heads that are not ancestors of common.
1512 909
1513 910 More specifically, return a list of nodes N such that every N
1514 911 satisfies the following constraints:
1515 912
1516 913 1. N is an ancestor of some node in 'heads'
1517 914 2. N is not an ancestor of any node in 'common'
1518 915
1519 916 The list is sorted by revision number, meaning it is
1520 917 topologically sorted.
1521 918
1522 919 'heads' and 'common' are both lists of node IDs. If heads is
1523 920 not supplied, uses all of the revlog's heads. If common is not
1524 921 supplied, uses nullid."""
1525 922 if common is None:
1526 923 common = [nullid]
1527 924 if heads is None:
1528 925 heads = self.heads()
1529 926
1530 927 common = [self.rev(n) for n in common]
1531 928 heads = [self.rev(n) for n in heads]
1532 929
1533 930 inc = self.incrementalmissingrevs(common=common)
1534 931 return [self.node(r) for r in inc.missingancestors(heads)]
1535 932
1536 933 def nodesbetween(self, roots=None, heads=None):
1537 934 """Return a topological path from 'roots' to 'heads'.
1538 935
1539 936 Return a tuple (nodes, outroots, outheads) where 'nodes' is a
1540 937 topologically sorted list of all nodes N that satisfy both of
1541 938 these constraints:
1542 939
1543 940 1. N is a descendant of some node in 'roots'
1544 941 2. N is an ancestor of some node in 'heads'
1545 942
1546 943 Every node is considered to be both a descendant and an ancestor
1547 944 of itself, so every reachable node in 'roots' and 'heads' will be
1548 945 included in 'nodes'.
1549 946
1550 947 'outroots' is the list of reachable nodes in 'roots', i.e., the
1551 948 subset of 'roots' that is returned in 'nodes'. Likewise,
1552 949 'outheads' is the subset of 'heads' that is also in 'nodes'.
1553 950
1554 951 'roots' and 'heads' are both lists of node IDs. If 'roots' is
1555 952 unspecified, uses nullid as the only root. If 'heads' is
1556 953 unspecified, uses list of all of the revlog's heads."""
1557 954 nonodes = ([], [], [])
1558 955 if roots is not None:
1559 956 roots = list(roots)
1560 957 if not roots:
1561 958 return nonodes
1562 959 lowestrev = min([self.rev(n) for n in roots])
1563 960 else:
1564 961 roots = [nullid] # Everybody's a descendant of nullid
1565 962 lowestrev = nullrev
1566 963 if (lowestrev == nullrev) and (heads is None):
1567 964 # We want _all_ the nodes!
1568 965 return ([self.node(r) for r in self], [nullid], list(self.heads()))
1569 966 if heads is None:
1570 967 # All nodes are ancestors, so the latest ancestor is the last
1571 968 # node.
1572 969 highestrev = len(self) - 1
1573 970 # Set ancestors to None to signal that every node is an ancestor.
1574 971 ancestors = None
1575 972 # Set heads to an empty dictionary for later discovery of heads
1576 973 heads = {}
1577 974 else:
1578 975 heads = list(heads)
1579 976 if not heads:
1580 977 return nonodes
1581 978 ancestors = set()
1582 979 # Turn heads into a dictionary so we can remove 'fake' heads.
1583 980 # Also, later we will be using it to filter out the heads we can't
1584 981 # find from roots.
1585 982 heads = dict.fromkeys(heads, False)
1586 983 # Start at the top and keep marking parents until we're done.
1587 984 nodestotag = set(heads)
1588 985 # Remember where the top was so we can use it as a limit later.
1589 986 highestrev = max([self.rev(n) for n in nodestotag])
1590 987 while nodestotag:
1591 988 # grab a node to tag
1592 989 n = nodestotag.pop()
1593 990 # Never tag nullid
1594 991 if n == nullid:
1595 992 continue
1596 993 # A node's revision number represents its place in a
1597 994 # topologically sorted list of nodes.
1598 995 r = self.rev(n)
1599 996 if r >= lowestrev:
1600 997 if n not in ancestors:
1601 998 # If we are possibly a descendant of one of the roots
1602 999 # and we haven't already been marked as an ancestor
1603 1000 ancestors.add(n) # Mark as ancestor
1604 1001 # Add non-nullid parents to list of nodes to tag.
1605 1002 nodestotag.update([p for p in self.parents(n) if
1606 1003 p != nullid])
1607 1004 elif n in heads: # We've seen it before, is it a fake head?
1608 1005 # So it is, real heads should not be the ancestors of
1609 1006 # any other heads.
1610 1007 heads.pop(n)
1611 1008 if not ancestors:
1612 1009 return nonodes
1613 1010 # Now that we have our set of ancestors, we want to remove any
1614 1011 # roots that are not ancestors.
1615 1012
1616 1013 # If one of the roots was nullid, everything is included anyway.
1617 1014 if lowestrev > nullrev:
1618 1015 # But, since we weren't, let's recompute the lowest rev to not
1619 1016 # include roots that aren't ancestors.
1620 1017
1621 1018 # Filter out roots that aren't ancestors of heads
1622 1019 roots = [root for root in roots if root in ancestors]
1623 1020 # Recompute the lowest revision
1624 1021 if roots:
1625 1022 lowestrev = min([self.rev(root) for root in roots])
1626 1023 else:
1627 1024 # No more roots? Return empty list
1628 1025 return nonodes
1629 1026 else:
1630 1027 # We are descending from nullid, and don't need to care about
1631 1028 # any other roots.
1632 1029 lowestrev = nullrev
1633 1030 roots = [nullid]
1634 1031 # Transform our roots list into a set.
1635 1032 descendants = set(roots)
1636 1033 # Also, keep the original roots so we can filter out roots that aren't
1637 1034 # 'real' roots (i.e. are descended from other roots).
1638 1035 roots = descendants.copy()
1639 1036 # Our topologically sorted list of output nodes.
1640 1037 orderedout = []
1641 1038 # Don't start at nullid since we don't want nullid in our output list,
1642 1039 # and if nullid shows up in descendants, empty parents will look like
1643 1040 # they're descendants.
1644 1041 for r in self.revs(start=max(lowestrev, 0), stop=highestrev + 1):
1645 1042 n = self.node(r)
1646 1043 isdescendant = False
1647 1044 if lowestrev == nullrev: # Everybody is a descendant of nullid
1648 1045 isdescendant = True
1649 1046 elif n in descendants:
1650 1047 # n is already a descendant
1651 1048 isdescendant = True
1652 1049 # This check only needs to be done here because all the roots
1653 1050 # will start being marked as descendants before the loop.
1654 1051 if n in roots:
1655 1052 # If n was a root, check if it's a 'real' root.
1656 1053 p = tuple(self.parents(n))
1657 1054 # If any of its parents are descendants, it's not a root.
1658 1055 if (p[0] in descendants) or (p[1] in descendants):
1659 1056 roots.remove(n)
1660 1057 else:
1661 1058 p = tuple(self.parents(n))
1662 1059 # A node is a descendant if either of its parents are
1663 1060 # descendants. (We seeded the descendants set with the roots
1664 1061 # up there, remember?)
1665 1062 if (p[0] in descendants) or (p[1] in descendants):
1666 1063 descendants.add(n)
1667 1064 isdescendant = True
1668 1065 if isdescendant and ((ancestors is None) or (n in ancestors)):
1669 1066 # Only include nodes that are both descendants and ancestors.
1670 1067 orderedout.append(n)
1671 1068 if (ancestors is not None) and (n in heads):
1672 1069 # We're trying to figure out which heads are reachable
1673 1070 # from roots.
1674 1071 # Mark this head as having been reached
1675 1072 heads[n] = True
1676 1073 elif ancestors is None:
1677 1074 # Otherwise, we're trying to discover the heads.
1678 1075 # Assume this is a head because if it isn't, the next step
1679 1076 # will eventually remove it.
1680 1077 heads[n] = True
1681 1078 # But, obviously its parents aren't.
1682 1079 for p in self.parents(n):
1683 1080 heads.pop(p, None)
1684 1081 heads = [head for head, flag in heads.iteritems() if flag]
1685 1082 roots = list(roots)
1686 1083 assert orderedout
1687 1084 assert roots
1688 1085 assert heads
1689 1086 return (orderedout, roots, heads)
1690 1087
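A call sketch for the traversal above; `rootnode` and `headnode` are hypothetical node ids:

nodes, outroots, outheads = rl.nodesbetween(roots=[rootnode], heads=[headnode])
# every node in `nodes` descends from a root and is an ancestor of a head;
# `outroots`/`outheads` are the subsets of the inputs actually reachable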
1691 1088 def headrevs(self):
1692 1089 try:
1693 1090 return self.index.headrevs()
1694 1091 except AttributeError:
1695 1092 return self._headrevs()
1696 1093
1697 1094 def computephases(self, roots):
1698 1095 return self.index.computephasesmapsets(roots)
1699 1096
1700 1097 def _headrevs(self):
1701 1098 count = len(self)
1702 1099 if not count:
1703 1100 return [nullrev]
1704 1101 # we won't iterate over filtered revs, so nobody is a head at start
1705 1102 ishead = [0] * (count + 1)
1706 1103 index = self.index
1707 1104 for r in self:
1708 1105 ishead[r] = 1 # I may be a head
1709 1106 e = index[r]
1710 1107 ishead[e[5]] = ishead[e[6]] = 0 # my parents are not
1711 1108 return [r for r, val in enumerate(ishead) if val]
1712 1109
1713 1110 def heads(self, start=None, stop=None):
1714 1111 """return the list of all nodes that have no children
1715 1112
1716 1113 if start is specified, only heads that are descendants of
1717 1114 start will be returned
1718 1115 if stop is specified, it will consider all the revs from stop
1719 1116 as if they had no children
1720 1117 """
1721 1118 if start is None and stop is None:
1722 1119 if not len(self):
1723 1120 return [nullid]
1724 1121 return [self.node(r) for r in self.headrevs()]
1725 1122
1726 1123 if start is None:
1727 1124 start = nullid
1728 1125 if stop is None:
1729 1126 stop = []
1730 1127 stoprevs = set([self.rev(n) for n in stop])
1731 1128 startrev = self.rev(start)
1732 1129 reachable = {startrev}
1733 1130 heads = {startrev}
1734 1131
1735 1132 parentrevs = self.parentrevs
1736 1133 for r in self.revs(start=startrev + 1):
1737 1134 for p in parentrevs(r):
1738 1135 if p in reachable:
1739 1136 if r not in stoprevs:
1740 1137 reachable.add(r)
1741 1138 heads.add(r)
1742 1139 if p in heads and p not in stoprevs:
1743 1140 heads.remove(p)
1744 1141
1745 1142 return [self.node(r) for r in heads]
1746 1143
1747 1144 def children(self, node):
1748 1145 """find the children of a given node"""
1749 1146 c = []
1750 1147 p = self.rev(node)
1751 1148 for r in self.revs(start=p + 1):
1752 1149 prevs = [pr for pr in self.parentrevs(r) if pr != nullrev]
1753 1150 if prevs:
1754 1151 for pr in prevs:
1755 1152 if pr == p:
1756 1153 c.append(self.node(r))
1757 1154 elif p == nullrev:
1758 1155 c.append(self.node(r))
1759 1156 return c
1760 1157
1761 1158 def commonancestorsheads(self, a, b):
1762 1159 """calculate all the heads of the common ancestors of nodes a and b"""
1763 1160 a, b = self.rev(a), self.rev(b)
1764 1161 ancs = self._commonancestorsheads(a, b)
1765 1162 return pycompat.maplist(self.node, ancs)
1766 1163
1767 1164 def _commonancestorsheads(self, *revs):
1768 1165 """calculate all the heads of the common ancestors of revs"""
1769 1166 try:
1770 1167 ancs = self.index.commonancestorsheads(*revs)
1771 1168 except (AttributeError, OverflowError): # C implementation failed
1772 1169 ancs = ancestor.commonancestorsheads(self.parentrevs, *revs)
1773 1170 return ancs
1774 1171
1775 1172 def isancestor(self, a, b):
1776 1173 """return True if node a is an ancestor of node b
1777 1174
1778 1175 A revision is considered an ancestor of itself."""
1779 1176 a, b = self.rev(a), self.rev(b)
1780 1177 return self.isancestorrev(a, b)
1781 1178
1782 1179 def isancestorrev(self, a, b):
1783 1180 """return True if revision a is an ancestor of revision b
1784 1181
1785 1182 A revision is considered an ancestor of itself.
1786 1183
1787 1184 The implementation of this is trivial but the use of
1788 1185 commonancestorsheads is not."""
1789 1186 if a == nullrev:
1790 1187 return True
1791 1188 elif a == b:
1792 1189 return True
1793 1190 elif a > b:
1794 1191 return False
1795 1192 return a in self._commonancestorsheads(a, b)
1796 1193
1797 1194 def ancestor(self, a, b):
1798 1195 """calculate the "best" common ancestor of nodes a and b"""
1799 1196
1800 1197 a, b = self.rev(a), self.rev(b)
1801 1198 try:
1802 1199 ancs = self.index.ancestors(a, b)
1803 1200 except (AttributeError, OverflowError):
1804 1201 ancs = ancestor.ancestors(self.parentrevs, a, b)
1805 1202 if ancs:
1806 1203 # choose a consistent winner when there's a tie
1807 1204 return min(map(self.node, ancs))
1808 1205 return nullid
1809 1206
1810 1207 def _match(self, id):
1811 1208 if isinstance(id, int):
1812 1209 # rev
1813 1210 return self.node(id)
1814 1211 if len(id) == 20:
1815 1212 # possibly a binary node
1816 1213 # odds of a binary node being all hex in ASCII are 1 in 10**25
1817 1214 try:
1818 1215 node = id
1819 1216 self.rev(node) # quick search the index
1820 1217 return node
1821 1218 except LookupError:
1822 1219 pass # may be partial hex id
1823 1220 try:
1824 1221 # str(rev)
1825 1222 rev = int(id)
1826 1223 if "%d" % rev != id:
1827 1224 raise ValueError
1828 1225 if rev < 0:
1829 1226 rev = len(self) + rev
1830 1227 if rev < 0 or rev >= len(self):
1831 1228 raise ValueError
1832 1229 return self.node(rev)
1833 1230 except (ValueError, OverflowError):
1834 1231 pass
1835 1232 if len(id) == 40:
1836 1233 try:
1837 1234 # a full hex nodeid?
1838 1235 node = bin(id)
1839 1236 self.rev(node)
1840 1237 return node
1841 1238 except (TypeError, LookupError):
1842 1239 pass
1843 1240
1844 1241 def _partialmatch(self, id):
1845 1242 # we don't care about wdirfilenodeids as they should always be full hashes
1846 1243 maybewdir = wdirhex.startswith(id)
1847 1244 try:
1848 1245 partial = self.index.partialmatch(id)
1849 1246 if partial and self.hasnode(partial):
1850 1247 if maybewdir:
1851 1248 # single 'ff...' match in radix tree, ambiguous with wdir
1852 1249 raise RevlogError
1853 1250 return partial
1854 1251 if maybewdir:
1855 1252 # no 'ff...' match in radix tree, wdir identified
1856 1253 raise error.WdirUnsupported
1857 1254 return None
1858 1255 except RevlogError:
1859 1256 # parsers.c radix tree lookup gave multiple matches
1860 1257 # fast path: for unfiltered changelog, radix tree is accurate
1861 1258 if not getattr(self, 'filteredrevs', None):
1862 1259 raise AmbiguousPrefixLookupError(id, self.indexfile,
1863 1260 _('ambiguous identifier'))
1864 1261 # fall through to slow path that filters hidden revisions
1865 1262 except (AttributeError, ValueError):
1866 1263 # we are pure python, or key was too short to search radix tree
1867 1264 pass
1868 1265
1869 1266 if id in self._pcache:
1870 1267 return self._pcache[id]
1871 1268
1872 1269 if len(id) <= 40:
1873 1270 try:
1874 1271 # hex(node)[:...]
1875 1272 l = len(id) // 2 # grab an even number of digits
1876 1273 prefix = bin(id[:l * 2])
1877 1274 nl = [e[7] for e in self.index if e[7].startswith(prefix)]
1878 1275 nl = [n for n in nl if hex(n).startswith(id) and
1879 1276 self.hasnode(n)]
1880 1277 if nullhex.startswith(id):
1881 1278 nl.append(nullid)
1882 1279 if len(nl) > 0:
1883 1280 if len(nl) == 1 and not maybewdir:
1884 1281 self._pcache[id] = nl[0]
1885 1282 return nl[0]
1886 1283 raise AmbiguousPrefixLookupError(id, self.indexfile,
1887 1284 _('ambiguous identifier'))
1888 1285 if maybewdir:
1889 1286 raise error.WdirUnsupported
1890 1287 return None
1891 1288 except TypeError:
1892 1289 pass
1893 1290
1894 1291 def lookup(self, id):
1895 1292 """locate a node based on:
1896 1293 - revision number or str(revision number)
1897 1294 - nodeid or subset of hex nodeid
1898 1295 """
1899 1296 n = self._match(id)
1900 1297 if n is not None:
1901 1298 return n
1902 1299 n = self._partialmatch(id)
1903 1300 if n:
1904 1301 return n
1905 1302
1906 1303 raise LookupError(id, self.indexfile, _('no match found'))
1907 1304
1908 1305 def shortest(self, node, minlength=1):
1909 1306 """Find the shortest unambiguous prefix that matches node."""
1910 1307 def isvalid(prefix):
1911 1308 try:
1912 1309 node = self._partialmatch(prefix)
1913 1310 except error.RevlogError:
1914 1311 return False
1915 1312 except error.WdirUnsupported:
1916 1313 # single 'ff...' match
1917 1314 return True
1918 1315 if node is None:
1919 1316 raise LookupError(node, self.indexfile, _('no node'))
1920 1317 return True
1921 1318
1922 1319 def maybewdir(prefix):
1923 1320 return all(c == 'f' for c in prefix)
1924 1321
1925 1322 hexnode = hex(node)
1926 1323
1927 1324 def disambiguate(hexnode, minlength):
1928 1325 """Disambiguate against wdirid."""
1929 1326 for length in range(minlength, 41):
1930 1327 prefix = hexnode[:length]
1931 1328 if not maybewdir(prefix):
1932 1329 return prefix
1933 1330
1934 1331 if not getattr(self, 'filteredrevs', None):
1935 1332 try:
1936 1333 length = max(self.index.shortest(node), minlength)
1937 1334 return disambiguate(hexnode, length)
1938 1335 except RevlogError:
1939 1336 if node != wdirid:
1940 1337 raise LookupError(node, self.indexfile, _('no node'))
1941 1338 except AttributeError:
1942 1339 # Fall through to pure code
1943 1340 pass
1944 1341
1945 1342 if node == wdirid:
1946 1343 for length in range(minlength, 41):
1947 1344 prefix = hexnode[:length]
1948 1345 if isvalid(prefix):
1949 1346 return prefix
1950 1347
1951 1348 for length in range(minlength, 41):
1952 1349 prefix = hexnode[:length]
1953 1350 if isvalid(prefix):
1954 1351 return disambiguate(hexnode, length)
1955 1352
1956 1353 def cmp(self, node, text):
1957 1354 """compare text with a given file revision
1958 1355
1959 1356 returns True if text is different from what is stored.
1960 1357 """
1961 1358 p1, p2 = self.parents(node)
1962 1359 return hash(text, p1, p2) != node
1963 1360
1964 1361 def _cachesegment(self, offset, data):
1965 1362 """Add a segment to the revlog cache.
1966 1363
1967 1364 Accepts an absolute offset and the data that is at that location.
1968 1365 """
1969 1366 o, d = self._chunkcache
1970 1367 # try to add to existing cache
1971 1368 if o + len(d) == offset and len(d) + len(data) < _chunksize:
1972 1369 self._chunkcache = o, d + data
1973 1370 else:
1974 1371 self._chunkcache = offset, data
1975 1372
1976 1373 def _readsegment(self, offset, length, df=None):
1977 1374 """Load a segment of raw data from the revlog.
1978 1375
1979 1376 Accepts an absolute offset, length to read, and an optional existing
1980 1377 file handle to read from.
1981 1378
1982 1379 If an existing file handle is passed, it will be seeked and the
1983 1380 original seek position will NOT be restored.
1984 1381
1985 1382 Returns a str or buffer of raw byte data.
1986 1383 """
1987 1384 # Cache data both forward and backward around the requested
1988 1385 # data, in a fixed size window. This helps speed up operations
1989 1386 # involving reading the revlog backwards.
1990 1387 cachesize = self._chunkcachesize
1991 1388 realoffset = offset & ~(cachesize - 1)
1992 1389 reallength = (((offset + length + cachesize) & ~(cachesize - 1))
1993 1390 - realoffset)
1994 1391 with self._datareadfp(df) as df:
1995 1392 df.seek(realoffset)
1996 1393 d = df.read(reallength)
1997 1394 self._cachesegment(realoffset, d)
1998 1395 if offset != realoffset or reallength != length:
1999 1396 return util.buffer(d, offset - realoffset, length)
2000 1397 return d
2001 1398
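The window arithmetic used above, written out once with concrete names; the 64KiB size is only an assumption for the sketch (self._chunkcachesize is configurable), and `offset`/`length` are hypothetical:

cachesize = 65536
realoffset = offset & ~(cachesize - 1)            # round start down to a window
reallength = (((offset + length + cachesize)
               & ~(cachesize - 1)) - realoffset)   # round the end up past it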
2002 1399 def _getsegment(self, offset, length, df=None):
2003 1400 """Obtain a segment of raw data from the revlog.
2004 1401
2005 1402 Accepts an absolute offset, length of bytes to obtain, and an
2006 1403 optional file handle to the already-opened revlog. If the file
2007 1404 handle is used, its original seek position will not be preserved.
2008 1405
2009 1406 Requests for data may be returned from a cache.
2010 1407
2011 1408 Returns a str or a buffer instance of raw byte data.
2012 1409 """
2013 1410 o, d = self._chunkcache
2014 1411 l = len(d)
2015 1412
2016 1413 # is it in the cache?
2017 1414 cachestart = offset - o
2018 1415 cacheend = cachestart + length
2019 1416 if cachestart >= 0 and cacheend <= l:
2020 1417 if cachestart == 0 and cacheend == l:
2021 1418 return d # avoid a copy
2022 1419 return util.buffer(d, cachestart, cacheend - cachestart)
2023 1420
2024 1421 return self._readsegment(offset, length, df=df)
2025 1422
2026 1423 def _getsegmentforrevs(self, startrev, endrev, df=None):
2027 1424 """Obtain a segment of raw data corresponding to a range of revisions.
2028 1425
2029 1426 Accepts the start and end revisions and an optional already-open
2030 1427 file handle to be used for reading. If the file handle is used, its
2031 1428 seek position will not be preserved.
2032 1429
2033 1430 Requests for data may be satisfied by a cache.
2034 1431
2035 1432 Returns a 2-tuple of (offset, data) for the requested range of
2036 1433 revisions. Offset is the integer offset from the beginning of the
2037 1434 revlog and data is a str or buffer of the raw byte data.
2038 1435
2039 1436 Callers will need to call ``self.start(rev)`` and ``self.length(rev)``
2040 1437 to determine where each revision's data begins and ends.
2041 1438 """
2042 1439 # Inlined self.start(startrev) & self.end(endrev) for perf reasons
2043 1440 # (functions are expensive).
2044 1441 index = self.index
2045 1442 istart = index[startrev]
2046 1443 start = int(istart[0] >> 16)
2047 1444 if startrev == endrev:
2048 1445 end = start + istart[1]
2049 1446 else:
2050 1447 iend = index[endrev]
2051 1448 end = int(iend[0] >> 16) + iend[1]
2052 1449
2053 1450 if self._inline:
2054 1451 start += (startrev + 1) * self._io.size
2055 1452 end += (endrev + 1) * self._io.size
2056 1453 length = end - start
2057 1454
2058 1455 return start, self._getsegment(start, length, df=df)
2059 1456
2060 1457 def _chunk(self, rev, df=None):
2061 1458 """Obtain a single decompressed chunk for a revision.
2062 1459
2063 1460 Accepts an integer revision and an optional already-open file handle
2064 1461 to be used for reading. If used, the seek position of the file will not
2065 1462 be preserved.
2066 1463
2067 1464 Returns a str holding uncompressed data for the requested revision.
2068 1465 """
2069 1466 return self.decompress(self._getsegmentforrevs(rev, rev, df=df)[1])
2070 1467
2071 1468 def _chunks(self, revs, df=None, targetsize=None):
2072 1469 """Obtain decompressed chunks for the specified revisions.
2073 1470
2074 1471 Accepts an iterable of numeric revisions that are assumed to be in
2075 1472 ascending order. Also accepts an optional already-open file handle
2076 1473 to be used for reading. If used, the seek position of the file will
2077 1474 not be preserved.
2078 1475
2079 1476 This function is similar to calling ``self._chunk()`` multiple times,
2080 1477 but is faster.
2081 1478
2082 1479 Returns a list with decompressed data for each requested revision.
2083 1480 """
2084 1481 if not revs:
2085 1482 return []
2086 1483 start = self.start
2087 1484 length = self.length
2088 1485 inline = self._inline
2089 1486 iosize = self._io.size
2090 1487 buffer = util.buffer
2091 1488
2092 1489 l = []
2093 1490 ladd = l.append
2094 1491
2095 1492 if not self._withsparseread:
2096 1493 slicedchunks = (revs,)
2097 1494 else:
2098 slicedchunks = _slicechunk(self, revs, targetsize=targetsize)
1495 slicedchunks = deltautil.slicechunk(self, revs,
1496 targetsize=targetsize)
2099 1497
2100 1498 for revschunk in slicedchunks:
2101 1499 firstrev = revschunk[0]
2102 1500 # Skip trailing revisions with empty diff
2103 1501 for lastrev in revschunk[::-1]:
2104 1502 if length(lastrev) != 0:
2105 1503 break
2106 1504
2107 1505 try:
2108 1506 offset, data = self._getsegmentforrevs(firstrev, lastrev, df=df)
2109 1507 except OverflowError:
2110 1508 # issue4215 - we can't cache a run of chunks greater than
2111 1509 # 2G on Windows
2112 1510 return [self._chunk(rev, df=df) for rev in revschunk]
2113 1511
2114 1512 decomp = self.decompress
2115 1513 for rev in revschunk:
2116 1514 chunkstart = start(rev)
2117 1515 if inline:
2118 1516 chunkstart += (rev + 1) * iosize
2119 1517 chunklength = length(rev)
2120 1518 ladd(decomp(buffer(data, chunkstart - offset, chunklength)))
2121 1519
2122 1520 return l
2123 1521
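The sparse-read path above now leans on the helper relocated by this change; a hedged consumption sketch, with `rl`, `revs` and `targetsize` assumed:

from mercurial.revlogutils import deltas as deltautil

for revschunk in deltautil.slicechunk(rl, revs, targetsize=targetsize):
    # each slice is a dense run of revisions that a single contiguous read
    # of the data file can satisfy (see _getsegmentforrevs above)
    offset, data = rl._getsegmentforrevs(revschunk[0], revschunk[-1])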
2124 1522 def _chunkclear(self):
2125 1523 """Clear the raw chunk cache."""
2126 1524 self._chunkcache = (0, '')
2127 1525
2128 1526 def deltaparent(self, rev):
2129 1527 """return deltaparent of the given revision"""
2130 1528 base = self.index[rev][3]
2131 1529 if base == rev:
2132 1530 return nullrev
2133 1531 elif self._generaldelta:
2134 1532 return base
2135 1533 else:
2136 1534 return rev - 1
2137 1535
2138 1536 def issnapshot(self, rev):
2139 1537 """tells whether rev is a snapshot
2140 1538 """
2141 1539 if rev == nullrev:
2142 1540 return True
2143 1541 deltap = self.deltaparent(rev)
2144 1542 if deltap == nullrev:
2145 1543 return True
2146 1544 p1, p2 = self.parentrevs(rev)
2147 1545 if deltap in (p1, p2):
2148 1546 return False
2149 1547 return self.issnapshot(deltap)
2150 1548
2151 1549 def snapshotdepth(self, rev):
2152 1550 """number of snapshot in the chain before this one"""
2153 1551 if not self.issnapshot(rev):
2154 1552 raise ProgrammingError('revision %d not a snapshot' % rev)
2155 1553 return len(self._deltachain(rev)[0]) - 1
2156 1554
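A small sketch tying the two snapshot helpers together; `rl` and `rev` are assumed:

# a revision is a snapshot when nothing in its delta chain is a delta
# against a parent; depth 0 means a full snapshot stored against nullrev
if rl.issnapshot(rev):
    depth = rl.snapshotdepth(rev)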
2157 1555 def revdiff(self, rev1, rev2):
2158 1556 """return or calculate a delta between two revisions
2159 1557
2160 1558 The delta calculated is in binary form and is intended to be written to
2161 1559 revlog data directly. So this function needs raw revision data.
2162 1560 """
2163 1561 if rev1 != nullrev and self.deltaparent(rev2) == rev1:
2164 1562 return bytes(self._chunk(rev2))
2165 1563
2166 1564 return mdiff.textdiff(self.revision(rev1, raw=True),
2167 1565 self.revision(rev2, raw=True))
2168 1566
2169 1567 def revision(self, nodeorrev, _df=None, raw=False):
2170 1568 """return an uncompressed revision of a given node or revision
2171 1569 number.
2172 1570
2173 1571 _df - an existing file handle to read from. (internal-only)
2174 1572 raw - an optional argument specifying if the revision data is to be
2175 1573 treated as raw data when applying flag transforms. 'raw' should be set
2176 1574 to True when generating changegroups or in debug commands.
2177 1575 """
2178 1576 if isinstance(nodeorrev, int):
2179 1577 rev = nodeorrev
2180 1578 node = self.node(rev)
2181 1579 else:
2182 1580 node = nodeorrev
2183 1581 rev = None
2184 1582
2185 1583 cachedrev = None
2186 1584 flags = None
2187 1585 rawtext = None
2188 1586 if node == nullid:
2189 1587 return ""
2190 1588 if self._cache:
2191 1589 if self._cache[0] == node:
2192 1590 # _cache only stores rawtext
2193 1591 if raw:
2194 1592 return self._cache[2]
2195 1593 # duplicated, but good for perf
2196 1594 if rev is None:
2197 1595 rev = self.rev(node)
2198 1596 if flags is None:
2199 1597 flags = self.flags(rev)
2200 1598 # no extra flags set, no flag processor runs, text = rawtext
2201 1599 if flags == REVIDX_DEFAULT_FLAGS:
2202 1600 return self._cache[2]
2203 1601 # rawtext is reusable. need to run flag processor
2204 1602 rawtext = self._cache[2]
2205 1603
2206 1604 cachedrev = self._cache[1]
2207 1605
2208 1606 # look up what we need to read
2209 1607 if rawtext is None:
2210 1608 if rev is None:
2211 1609 rev = self.rev(node)
2212 1610
2213 1611 chain, stopped = self._deltachain(rev, stoprev=cachedrev)
2214 1612 if stopped:
2215 1613 rawtext = self._cache[2]
2216 1614
2217 1615 # drop cache to save memory
2218 1616 self._cache = None
2219 1617
2220 1618 targetsize = None
2221 1619 rawsize = self.index[rev][2]
2222 1620 if 0 <= rawsize:
2223 1621 targetsize = 4 * rawsize
2224 1622
2225 1623 bins = self._chunks(chain, df=_df, targetsize=targetsize)
2226 1624 if rawtext is None:
2227 1625 rawtext = bytes(bins[0])
2228 1626 bins = bins[1:]
2229 1627
2230 1628 rawtext = mdiff.patches(rawtext, bins)
2231 1629 self._cache = (node, rev, rawtext)
2232 1630
2233 1631 if flags is None:
2234 1632 if rev is None:
2235 1633 rev = self.rev(node)
2236 1634 flags = self.flags(rev)
2237 1635
2238 1636 text, validatehash = self._processflags(rawtext, flags, 'read', raw=raw)
2239 1637 if validatehash:
2240 1638 self.checkhash(text, node, rev=rev)
2241 1639
2242 1640 return text
2243 1641
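A usage sketch of the two read modes; `rl` and `node` are assumed:

text = rl.revision(node)               # 'read' flag transforms applied
rawtext = rl.revision(node, raw=True)  # exactly what the delta chain rebuilds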
2244 1642 def hash(self, text, p1, p2):
2245 1643 """Compute a node hash.
2246 1644
2247 1645 Available as a function so that subclasses can replace the hash
2248 1646 as needed.
2249 1647 """
2250 1648 return hash(text, p1, p2)
2251 1649
2252 1650 def _processflags(self, text, flags, operation, raw=False):
2253 1651 """Inspect revision data flags and applies transforms defined by
2254 1652 registered flag processors.
2255 1653
2256 1654 ``text`` - the revision data to process
2257 1655 ``flags`` - the revision flags
2258 1656 ``operation`` - the operation being performed (read or write)
2259 1657 ``raw`` - an optional argument describing if the raw transform should be
2260 1658 applied.
2261 1659
2262 1660 This method processes the flags in the order (or reverse order if
2263 1661 ``operation`` is 'write') defined by REVIDX_FLAGS_ORDER, applying the
2264 1662 flag processors registered for present flags. The order of flags defined
2265 1663 in REVIDX_FLAGS_ORDER needs to be stable to allow non-commutativity.
2266 1664
2267 1665 Returns a 2-tuple of ``(text, validatehash)`` where ``text`` is the
2268 1666 processed text and ``validatehash`` is a bool indicating whether the
2269 1667 returned text should be checked for hash integrity.
2270 1668
2271 1669 Note: If the ``raw`` argument is set, it has precedence over the
2272 1670 operation and will only update the value of ``validatehash``.
2273 1671 """
2274 1672 # fast path: no flag processors will run
2275 1673 if flags == 0:
2276 1674 return text, True
2277 1675 if operation not in ('read', 'write'):
2278 1676 raise ProgrammingError(_("invalid '%s' operation") % operation)
2279 1677 # Check all flags are known.
2280 1678 if flags & ~REVIDX_KNOWN_FLAGS:
2281 1679 raise RevlogError(_("incompatible revision flag '%#x'") %
2282 1680 (flags & ~REVIDX_KNOWN_FLAGS))
2283 1681 validatehash = True
2284 1682 # Depending on the operation (read or write), the order might be
2285 1683 # reversed due to non-commutative transforms.
2286 1684 orderedflags = REVIDX_FLAGS_ORDER
2287 1685 if operation == 'write':
2288 1686 orderedflags = reversed(orderedflags)
2289 1687
2290 1688 for flag in orderedflags:
2291 1689 # If a flagprocessor has been registered for a known flag, apply the
2292 1690 # related operation transform and update result tuple.
2293 1691 if flag & flags:
2294 1692 vhash = True
2295 1693
2296 1694 if flag not in _flagprocessors:
2297 1695 message = _("missing processor for flag '%#x'") % (flag)
2298 1696 raise RevlogError(message)
2299 1697
2300 1698 processor = _flagprocessors[flag]
2301 1699 if processor is not None:
2302 1700 readtransform, writetransform, rawtransform = processor
2303 1701
2304 1702 if raw:
2305 1703 vhash = rawtransform(self, text)
2306 1704 elif operation == 'read':
2307 1705 text, vhash = readtransform(self, text)
2308 1706 else: # write operation
2309 1707 text, vhash = writetransform(self, text)
2310 1708 validatehash = validatehash and vhash
2311 1709
2312 1710 return text, validatehash
2313 1711
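A hedged round-trip sketch of the flag pipeline; `rl`, `text` and `someflags` are hypothetical, and the point is only the ordering noted in the docstring ('write' applies transforms in reverse so a later 'read' can undo them):

rawtext, validatehash = rl._processflags(text, someflags, 'write')
text2, validatehash = rl._processflags(rawtext, someflags, 'read')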
2314 1712 def checkhash(self, text, node, p1=None, p2=None, rev=None):
2315 1713 """Check node hash integrity.
2316 1714
2317 1715 Available as a function so that subclasses can extend hash mismatch
2318 1716 behaviors as needed.
2319 1717 """
2320 1718 try:
2321 1719 if p1 is None and p2 is None:
2322 1720 p1, p2 = self.parents(node)
2323 1721 if node != self.hash(text, p1, p2):
2324 1722 revornode = rev
2325 1723 if revornode is None:
2326 1724 revornode = templatefilters.short(hex(node))
2327 1725 raise RevlogError(_("integrity check failed on %s:%s")
2328 1726 % (self.indexfile, pycompat.bytestr(revornode)))
2329 1727 except RevlogError:
2330 1728 if self._censorable and _censoredtext(text):
2331 1729 raise error.CensoredNodeError(self.indexfile, node, text)
2332 1730 raise
2333 1731
2334 1732 def _enforceinlinesize(self, tr, fp=None):
2335 1733 """Check if the revlog is too big for inline and convert if so.
2336 1734
2337 1735 This should be called after revisions are added to the revlog. If the
2338 1736 revlog has grown too large to be an inline revlog, it will convert it
2339 1737 to use multiple index and data files.
2340 1738 """
2341 1739 tiprev = len(self) - 1
2342 1740 if (not self._inline or
2343 1741 (self.start(tiprev) + self.length(tiprev)) < _maxinline):
2344 1742 return
2345 1743
2346 1744 trinfo = tr.find(self.indexfile)
2347 1745 if trinfo is None:
2348 1746 raise RevlogError(_("%s not found in the transaction")
2349 1747 % self.indexfile)
2350 1748
2351 1749 trindex = trinfo[2]
2352 1750 if trindex is not None:
2353 1751 dataoff = self.start(trindex)
2354 1752 else:
2355 1753 # revlog was stripped at start of transaction, use all leftover data
2356 1754 trindex = len(self) - 1
2357 1755 dataoff = self.end(tiprev)
2358 1756
2359 1757 tr.add(self.datafile, dataoff)
2360 1758
2361 1759 if fp:
2362 1760 fp.flush()
2363 1761 fp.close()
2364 1762
2365 1763 with self._datafp('w') as df:
2366 1764 for r in self:
2367 1765 df.write(self._getsegmentforrevs(r, r)[1])
2368 1766
2369 1767 with self._indexfp('w') as fp:
2370 1768 self.version &= ~FLAG_INLINE_DATA
2371 1769 self._inline = False
2372 1770 io = self._io
2373 1771 for i in self:
2374 1772 e = io.packentry(self.index[i], self.node, self.version, i)
2375 1773 fp.write(e)
2376 1774
2377 1775 # the temp file replaces the real index when we exit the context
2378 1776 # manager
2379 1777
2380 1778 tr.replace(self.indexfile, trindex * self._io.size)
2381 1779 self._chunkclear()
2382 1780
2383 1781 def addrevision(self, text, transaction, link, p1, p2, cachedelta=None,
2384 1782 node=None, flags=REVIDX_DEFAULT_FLAGS, deltacomputer=None):
2385 1783 """add a revision to the log
2386 1784
2387 1785 text - the revision data to add
2388 1786 transaction - the transaction object used for rollback
2389 1787 link - the linkrev data to add
2390 1788 p1, p2 - the parent nodeids of the revision
2391 1789 cachedelta - an optional precomputed delta
2392 1790 node - nodeid of revision; typically node is not specified, and it is
2393 1791 computed by default as hash(text, p1, p2), however subclasses might
2394 1792 use a different hashing method (and override checkhash() in that case)
2395 1793 flags - the known flags to set on the revision
2396 deltacomputer - an optional _deltacomputer instance shared between
1794 deltacomputer - an optional deltacomputer instance shared between
2397 1795 multiple calls
2398 1796 """
2399 1797 if link == nullrev:
2400 1798 raise RevlogError(_("attempted to add linkrev -1 to %s")
2401 1799 % self.indexfile)
2402 1800
2403 1801 if flags:
2404 1802 node = node or self.hash(text, p1, p2)
2405 1803
2406 1804 rawtext, validatehash = self._processflags(text, flags, 'write')
2407 1805
2408 1806 # If the flag processor modifies the revision data, ignore any provided
2409 1807 # cachedelta.
2410 1808 if rawtext != text:
2411 1809 cachedelta = None
2412 1810
2413 1811 if len(rawtext) > _maxentrysize:
2414 1812 raise RevlogError(
2415 1813 _("%s: size of %d bytes exceeds maximum revlog storage of 2GiB")
2416 1814 % (self.indexfile, len(rawtext)))
2417 1815
2418 1816 node = node or self.hash(rawtext, p1, p2)
2419 1817 if node in self.nodemap:
2420 1818 return node
2421 1819
2422 1820 if validatehash:
2423 1821 self.checkhash(rawtext, node, p1=p1, p2=p2)
2424 1822
2425 1823 return self.addrawrevision(rawtext, transaction, link, p1, p2, node,
2426 1824 flags, cachedelta=cachedelta,
2427 1825 deltacomputer=deltacomputer)
2428 1826
2429 1827 def addrawrevision(self, rawtext, transaction, link, p1, p2, node, flags,
2430 1828 cachedelta=None, deltacomputer=None):
2431 1829 """add a raw revision with known flags, node and parents
2432 1830 useful when reusing a revision not stored in this revlog (ex: received
2433 1831 over wire, or read from an external bundle).
2434 1832 """
2435 1833 dfh = None
2436 1834 if not self._inline:
2437 1835 dfh = self._datafp("a+")
2438 1836 ifh = self._indexfp("a+")
2439 1837 try:
2440 1838 return self._addrevision(node, rawtext, transaction, link, p1, p2,
2441 1839 flags, cachedelta, ifh, dfh,
2442 1840 deltacomputer=deltacomputer)
2443 1841 finally:
2444 1842 if dfh:
2445 1843 dfh.close()
2446 1844 ifh.close()
2447 1845
2448 1846 def compress(self, data):
2449 1847 """Generate a possibly-compressed representation of data."""
2450 1848 if not data:
2451 1849 return '', data
2452 1850
2453 1851 compressed = self._compressor.compress(data)
2454 1852
2455 1853 if compressed:
2456 1854 # The revlog compressor added the header in the returned data.
2457 1855 return '', compressed
2458 1856
2459 1857 if data[0:1] == '\0':
2460 1858 return '', data
2461 1859 return 'u', data
2462 1860
2463 1861 def decompress(self, data):
2464 1862 """Decompress a revlog chunk.
2465 1863
2466 1864 The chunk is expected to begin with a header identifying the
2467 1865 format type so it can be routed to an appropriate decompressor.
2468 1866 """
2469 1867 if not data:
2470 1868 return data
2471 1869
2472 1870 # Revlogs are read much more frequently than they are written and many
2473 1871 # chunks only take microseconds to decompress, so performance is
2474 1872 # important here.
2475 1873 #
2476 1874 # We can make a few assumptions about revlogs:
2477 1875 #
2478 1876 # 1) the majority of chunks will be compressed (as opposed to inline
2479 1877 # raw data).
2480 1878 # 2) decompressing *any* data will likely be at least 10x slower than
2481 1879 # returning raw inline data.
2482 1880 # 3) we want to prioritize common and officially supported compression
2483 1881 # engines
2484 1882 #
2485 1883 # It follows that we want to optimize for "decompress compressed data
2486 1884 # when encoded with common and officially supported compression engines"
2487 1885 # case over "raw data" and "data encoded by less common or non-official
2488 1886 # compression engines." That is why we have the inline lookup first
2489 1887 # followed by the compengines lookup.
2490 1888 #
2491 1889 # According to `hg perfrevlogchunks`, this is ~0.5% faster for zlib
2492 1890 # compressed chunks. And this matters for changelog and manifest reads.
2493 1891 t = data[0:1]
2494 1892
2495 1893 if t == 'x':
2496 1894 try:
2497 1895 return _zlibdecompress(data)
2498 1896 except zlib.error as e:
2499 1897 raise RevlogError(_('revlog decompress error: %s') %
2500 1898 stringutil.forcebytestr(e))
2501 1899 # '\0' is more common than 'u' so it goes first.
2502 1900 elif t == '\0':
2503 1901 return data
2504 1902 elif t == 'u':
2505 1903 return util.buffer(data, 1)
2506 1904
2507 1905 try:
2508 1906 compressor = self._decompressors[t]
2509 1907 except KeyError:
2510 1908 try:
2511 1909 engine = util.compengines.forrevlogheader(t)
2512 1910 compressor = engine.revlogcompressor()
2513 1911 self._decompressors[t] = compressor
2514 1912 except KeyError:
2515 1913 raise RevlogError(_('unknown compression type %r') % t)
2516 1914
2517 1915 return compressor.decompress(data)
2518 1916
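A round-trip sketch for the pair above; `rl` is assumed and `sometext` is any hypothetical bytes payload:

# compress() returns a (header, data) pair; the two parts are concatenated
# on disk, and decompress() reverses whichever encoding was chosen
header, data = rl.compress(sometext)
restored = rl.decompress(header + data)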
2519 def _isgooddeltainfo(self, deltainfo, revinfo):
2520 """Returns True if the given delta is good. Good means that it is within
2521 the disk span, disk size, and chain length bounds that we know to be
2522 performant."""
2523 if deltainfo is None:
2524 return False
2525
2526 # - 'deltainfo.distance' is the distance from the base revision --
2527 # bounding it limits the amount of I/O we need to do.
2528 # - 'deltainfo.compresseddeltalen' is the sum of the total size of
2529 # deltas we need to apply -- bounding it limits the amount of CPU
2530 # we consume.
2531
2532 if self._sparserevlog:
2533 # As sparse-read will be used, we can consider that the distance,
2534 # instead of being the span of the whole chunk,
2535 # is the span of the largest read chunk
2536 base = deltainfo.base
2537
2538 if base != nullrev:
2539 deltachain = self._deltachain(base)[0]
2540 else:
2541 deltachain = []
2542
2543 # search for the first non-snapshot revision
2544 for idx, r in enumerate(deltachain):
2545 if not self.issnapshot(r):
2546 break
2547 deltachain = deltachain[idx:]
2548 chunks = _slicechunk(self, deltachain, deltainfo)
2549 all_span = [_segmentspan(self, revs, deltainfo) for revs in chunks]
2550 distance = max(all_span)
2551 else:
2552 distance = deltainfo.distance
2553
2554 textlen = revinfo.textlen
2555 defaultmax = textlen * 4
2556 maxdist = self._maxdeltachainspan
2557 if not maxdist:
2558 maxdist = distance # ensure the conditional pass
2559 maxdist = max(maxdist, defaultmax)
2560 if self._sparserevlog and maxdist < self._srmingapsize:
2561 # In multiple places, we ignore irrelevant data ranges below a
2562 # certain size. We also apply this tradeoff here and relax the span
2563 # constraint for small enough content.
2564 maxdist = self._srmingapsize
2565
2566 # Bad delta from read span:
2567 #
2568 # If the span of data read is larger than the maximum allowed.
2569 if maxdist < distance:
2570 return False
2571
2572 # Bad delta from new delta size:
2573 #
2574 # If the delta size is larger than the target text, storing the
2575 # delta will be inefficient.
2576 if textlen < deltainfo.deltalen:
2577 return False
2578
2579 # Bad delta from cumulated payload size:
2580 #
2581 # If the sum of the deltas gets larger than K * the target text length.
2582 if textlen * LIMIT_DELTA2TEXT < deltainfo.compresseddeltalen:
2583 return False
2584
2585 # Bad delta from chain length:
2586 #
2587 # If the number of deltas in the chain gets too high.
2588 if self._maxchainlen and self._maxchainlen < deltainfo.chainlen:
2589 return False
2590
2591 # bad delta from intermediate snapshot size limit
2592 #
2593 # If an intermediate snapshot size is higher than the limit. The
2594 # limit exists to prevent an endless chain of intermediate deltas
2595 # from being created.
2596 if (deltainfo.snapshotdepth is not None and
2597 (textlen >> deltainfo.snapshotdepth) < deltainfo.deltalen):
2598 return False
2599
2600 # bad delta if new intermediate snapshot is larger than the previous
2601 # snapshot
2602 if (deltainfo.snapshotdepth
2603 and self.length(deltainfo.base) < deltainfo.deltalen):
2604 return False
2605
2606 return True
2607
2608 1917 def _addrevision(self, node, rawtext, transaction, link, p1, p2, flags,
2609 1918 cachedelta, ifh, dfh, alwayscache=False,
2610 1919 deltacomputer=None):
2611 1920 """internal function to add revisions to the log
2612 1921
2613 1922 see addrevision for argument descriptions.
2614 1923
2615 1924 note: "addrevision" takes non-raw text, "_addrevision" takes raw text.
2616 1925
2617 1926 if "deltacomputer" is not provided or None, a defaultdeltacomputer will
2618 1927 be used.
2619 1928
2620 1929 invariants:
2621 1930 - rawtext is optional (can be None); if not set, cachedelta must be set.
2622 1931 if both are set, they must correspond to each other.
2623 1932 """
2624 1933 if node == nullid:
2625 1934 raise RevlogError(_("%s: attempt to add null revision") %
2626 1935 (self.indexfile))
2627 1936 if node == wdirid or node in wdirfilenodeids:
2628 1937 raise RevlogError(_("%s: attempt to add wdir revision") %
2629 1938 (self.indexfile))
2630 1939
2631 1940 if self._inline:
2632 1941 fh = ifh
2633 1942 else:
2634 1943 fh = dfh
2635 1944
2636 1945 btext = [rawtext]
2637 1946
2638 1947 curr = len(self)
2639 1948 prev = curr - 1
2640 1949 offset = self.end(prev)
2641 1950 p1r, p2r = self.rev(p1), self.rev(p2)
2642 1951
2643 1952 # full versions are inserted when the needed deltas
2644 1953 # become comparable to the uncompressed text
2645 1954 if rawtext is None:
2646 1955 # need rawtext size, before changed by flag processors, which is
2647 1956 # the non-raw size. use revlog explicitly to avoid filelog's extra
2648 1957 # logic that might remove metadata size.
2649 1958 textlen = mdiff.patchedsize(revlog.size(self, cachedelta[0]),
2650 1959 cachedelta[1])
2651 1960 else:
2652 1961 textlen = len(rawtext)
2653 1962
2654 1963 if deltacomputer is None:
2655 deltacomputer = _deltacomputer(self)
1964 deltacomputer = deltautil.deltacomputer(self)
2656 1965
2657 1966 revinfo = _revisioninfo(node, p1, p2, btext, textlen, cachedelta, flags)
2658 1967
2659 1968 # no delta for flag processor revision (see "candelta" for why)
2660 1969 # not calling candelta since only one revision needs test, also to
2661 1970 # avoid overhead fetching flags again.
2662 1971 if flags & REVIDX_RAWTEXT_CHANGING_FLAGS:
2663 1972 deltainfo = None
2664 1973 else:
2665 1974 deltainfo = deltacomputer.finddeltainfo(revinfo, fh)
2666 1975
2667 1976 if deltainfo is not None:
2668 1977 base = deltainfo.base
2669 1978 chainbase = deltainfo.chainbase
2670 1979 data = deltainfo.data
2671 1980 l = deltainfo.deltalen
2672 1981 else:
2673 1982 rawtext = deltacomputer.buildtext(revinfo, fh)
2674 1983 data = self.compress(rawtext)
2675 1984 l = len(data[1]) + len(data[0])
2676 1985 base = chainbase = curr
2677 1986
2678 1987 e = (offset_type(offset, flags), l, textlen,
2679 1988 base, link, p1r, p2r, node)
2680 1989 self.index.append(e)
2681 1990 self.nodemap[node] = curr
2682 1991
2683 1992 entry = self._io.packentry(e, self.node, self.version, curr)
2684 1993 self._writeentry(transaction, ifh, dfh, entry, data, link, offset)
2685 1994
2686 1995 if alwayscache and rawtext is None:
2687 1996 rawtext = deltacomputer.buildtext(revinfo, fh)
2688 1997
2689 1998 if type(rawtext) == bytes: # only accept immutable objects
2690 1999 self._cache = (node, curr, rawtext)
2691 2000 self._chainbasecache[curr] = chainbase
2692 2001 return node
2693 2002
2694 2003 def _writeentry(self, transaction, ifh, dfh, entry, data, link, offset):
2695 2004 # Files opened in a+ mode have inconsistent behavior on various
2696 2005 # platforms. Windows requires that a file positioning call be made
2697 2006 # when the file handle transitions between reads and writes. See
2698 2007 # 3686fa2b8eee and the mixedfilemodewrapper in windows.py. On other
2699 2008 # platforms, Python or the platform itself can be buggy. Some versions
2700 2009 # of Solaris have been observed to not append at the end of the file
2701 2010 # if the file was seeked to before the end. See issue4943 for more.
2702 2011 #
2703 2012 # We work around this issue by inserting a seek() before writing.
2704 2013 # Note: This is likely not necessary on Python 3.
2705 2014 ifh.seek(0, os.SEEK_END)
2706 2015 if dfh:
2707 2016 dfh.seek(0, os.SEEK_END)
2708 2017
2709 2018 curr = len(self) - 1
2710 2019 if not self._inline:
2711 2020 transaction.add(self.datafile, offset)
2712 2021 transaction.add(self.indexfile, curr * len(entry))
2713 2022 if data[0]:
2714 2023 dfh.write(data[0])
2715 2024 dfh.write(data[1])
2716 2025 ifh.write(entry)
2717 2026 else:
2718 2027 offset += curr * self._io.size
2719 2028 transaction.add(self.indexfile, offset, curr)
2720 2029 ifh.write(entry)
2721 2030 ifh.write(data[0])
2722 2031 ifh.write(data[1])
2723 2032 self._enforceinlinesize(transaction, ifh)
2724 2033
2725 2034 def addgroup(self, deltas, linkmapper, transaction, addrevisioncb=None):
2726 2035 """
2727 2036 add a delta group
2728 2037
2729 2038 given a set of deltas, add them to the revision log. the
2730 2039 first delta is against its parent, which should be in our
2731 2040 log, the rest are against the previous delta.
2732 2041
2733 2042 If ``addrevisioncb`` is defined, it will be called with arguments of
2734 2043 this revlog and the node that was added.
2735 2044 """
2736 2045
2737 2046 nodes = []
2738 2047
2739 2048 r = len(self)
2740 2049 end = 0
2741 2050 if r:
2742 2051 end = self.end(r - 1)
2743 2052 ifh = self._indexfp("a+")
2744 2053 isize = r * self._io.size
2745 2054 if self._inline:
2746 2055 transaction.add(self.indexfile, end + isize, r)
2747 2056 dfh = None
2748 2057 else:
2749 2058 transaction.add(self.indexfile, isize, r)
2750 2059 transaction.add(self.datafile, end)
2751 2060 dfh = self._datafp("a+")
2752 2061 def flush():
2753 2062 if dfh:
2754 2063 dfh.flush()
2755 2064 ifh.flush()
2756 2065 try:
2757 deltacomputer = _deltacomputer(self)
2066 deltacomputer = deltautil.deltacomputer(self)
2758 2067 # loop through our set of deltas
2759 2068 for data in deltas:
2760 2069 node, p1, p2, linknode, deltabase, delta, flags = data
2761 2070 link = linkmapper(linknode)
2762 2071 flags = flags or REVIDX_DEFAULT_FLAGS
2763 2072
2764 2073 nodes.append(node)
2765 2074
2766 2075 if node in self.nodemap:
2767 2076 # this can happen if two branches make the same change
2768 2077 continue
2769 2078
2770 2079 for p in (p1, p2):
2771 2080 if p not in self.nodemap:
2772 2081 raise LookupError(p, self.indexfile,
2773 2082 _('unknown parent'))
2774 2083
2775 2084 if deltabase not in self.nodemap:
2776 2085 raise LookupError(deltabase, self.indexfile,
2777 2086 _('unknown delta base'))
2778 2087
2779 2088 baserev = self.rev(deltabase)
2780 2089
2781 2090 if baserev != nullrev and self.iscensored(baserev):
2782 2091 # if base is censored, delta must be full replacement in a
2783 2092 # single patch operation
2784 2093 hlen = struct.calcsize(">lll")
2785 2094 oldlen = self.rawsize(baserev)
2786 2095 newlen = len(delta) - hlen
2787 2096 if delta[:hlen] != mdiff.replacediffheader(oldlen, newlen):
2788 2097 raise error.CensoredBaseError(self.indexfile,
2789 2098 self.node(baserev))
2790 2099
2791 2100 if not flags and self._peek_iscensored(baserev, delta, flush):
2792 2101 flags |= REVIDX_ISCENSORED
2793 2102
2794 2103 # We assume consumers of addrevisioncb will want to retrieve
2795 2104 # the added revision, which will require a call to
2796 2105 # revision(). revision() will fast path if there is a cache
2797 2106 # hit. So, we tell _addrevision() to always cache in this case.
2798 2107 # We're only using addgroup() in the context of changegroup
2799 2108 # generation so the revision data can always be handled as raw
2800 2109 # by the flagprocessor.
2801 2110 self._addrevision(node, None, transaction, link,
2802 2111 p1, p2, flags, (baserev, delta),
2803 2112 ifh, dfh,
2804 2113 alwayscache=bool(addrevisioncb),
2805 2114 deltacomputer=deltacomputer)
2806 2115
2807 2116 if addrevisioncb:
2808 2117 addrevisioncb(self, node)
2809 2118
2810 2119 if not dfh and not self._inline:
2811 2120 # addrevision switched from inline to conventional
2812 2121 # reopen the index
2813 2122 ifh.close()
2814 2123 dfh = self._datafp("a+")
2815 2124 ifh = self._indexfp("a+")
2816 2125 finally:
2817 2126 if dfh:
2818 2127 dfh.close()
2819 2128 ifh.close()
2820 2129
2821 2130 return nodes
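
As an illustrative sketch only (none of these names come from the change itself), the iterable consumed by addgroup() is a series of 7-tuples, and the linkmapper turns each linknode into the changelog revision it is bound to:

    # Hypothetical caller-side sketch; `fl`, `repo` and the node/delta values
    # are assumed to exist, and `deltabytes` to be a valid bdiff patch.
    deltas = [
        # (node, p1, p2, linknode, deltabase, delta, flags)
        (newnode, p1node, p2node, linknode, basenode, deltabytes, 0),
    ]
    with repo.transaction('illustration') as tr:
        added = fl.addgroup(deltas, repo.changelog.rev, tr)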
2822 2131
2823 2132 def iscensored(self, rev):
2824 2133 """Check if a file revision is censored."""
2825 2134 if not self._censorable:
2826 2135 return False
2827 2136
2828 2137 return self.flags(rev) & REVIDX_ISCENSORED
2829 2138
2830 2139 def _peek_iscensored(self, baserev, delta, flush):
2831 2140 """Quickly check if a delta produces a censored revision."""
2832 2141 if not self._censorable:
2833 2142 return False
2834 2143
2835 2144 # Fragile heuristic: unless new file meta keys are added alphabetically
2836 2145 # preceding "censored", all censored revisions are prefixed by
2837 2146 # "\1\ncensored:". A delta producing such a censored revision must be a
2838 2147 # full-replacement delta, so we inspect the first and only patch in the
2839 2148 # delta for this prefix.
2840 2149 hlen = struct.calcsize(">lll")
2841 2150 if len(delta) <= hlen:
2842 2151 return False
2843 2152
2844 2153 oldlen = self.rawsize(baserev)
2845 2154 newlen = len(delta) - hlen
2846 2155 if delta[:hlen] != mdiff.replacediffheader(oldlen, newlen):
2847 2156 return False
2848 2157
2849 2158 add = "\1\ncensored:"
2850 2159 addlen = len(add)
2851 2160 return newlen >= addlen and delta[hlen:hlen + addlen] == add
2852 2161
2853 2162 def getstrippoint(self, minlink):
2854 2163 """find the minimum rev that must be stripped to strip the linkrev
2855 2164
2856 2165 Returns a tuple containing the minimum rev and a set of all revs that
2857 2166 have linkrevs that will be broken by this strip.
2858 2167 """
2859 2168 brokenrevs = set()
2860 2169 strippoint = len(self)
2861 2170
2862 2171 heads = {}
2863 2172 futurelargelinkrevs = set()
2864 2173 for head in self.headrevs():
2865 2174 headlinkrev = self.linkrev(head)
2866 2175 heads[head] = headlinkrev
2867 2176 if headlinkrev >= minlink:
2868 2177 futurelargelinkrevs.add(headlinkrev)
2869 2178
2870 2179 # This algorithm involves walking down the rev graph, starting at the
2871 2180 # heads. Since the revs are topologically sorted according to linkrev,
2872 2181 # once all head linkrevs are below the minlink, we know there are
2873 2182 # no more revs that could have a linkrev greater than minlink.
2874 2183 # So we can stop walking.
2875 2184 while futurelargelinkrevs:
2876 2185 strippoint -= 1
2877 2186 linkrev = heads.pop(strippoint)
2878 2187
2879 2188 if linkrev < minlink:
2880 2189 brokenrevs.add(strippoint)
2881 2190 else:
2882 2191 futurelargelinkrevs.remove(linkrev)
2883 2192
2884 2193 for p in self.parentrevs(strippoint):
2885 2194 if p != nullrev:
2886 2195 plinkrev = self.linkrev(p)
2887 2196 heads[p] = plinkrev
2888 2197 if plinkrev >= minlink:
2889 2198 futurelargelinkrevs.add(plinkrev)
2890 2199
2891 2200 return strippoint, brokenrevs
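
A usage sketch, assuming `rl` is an open revlog and `minlink` is the first changelog revision being stripped; the result feeds directly into strip() below:

    strippoint, brokenrevs = rl.getstrippoint(minlink)
    # revisions >= strippoint will be truncated by rl.strip(minlink, tr);
    # brokenrevs are revisions that get truncated even though their linked
    # changeset survives, so the caller must save and re-add them afterwards.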
2892 2201
2893 2202 def strip(self, minlink, transaction):
2894 2203 """truncate the revlog on the first revision with a linkrev >= minlink
2895 2204
2896 2205 This function is called when we're stripping revision minlink and
2897 2206 its descendants from the repository.
2898 2207
2899 2208 We have to remove all revisions with linkrev >= minlink, because
2900 2209 the equivalent changelog revisions will be renumbered after the
2901 2210 strip.
2902 2211
2903 2212 So we truncate the revlog on the first of these revisions, and
2904 2213 trust that the caller has saved the revisions that shouldn't be
2905 2214 removed and that it'll re-add them after this truncation.
2906 2215 """
2907 2216 if len(self) == 0:
2908 2217 return
2909 2218
2910 2219 rev, _ = self.getstrippoint(minlink)
2911 2220 if rev == len(self):
2912 2221 return
2913 2222
2914 2223 # first truncate the files on disk
2915 2224 end = self.start(rev)
2916 2225 if not self._inline:
2917 2226 transaction.add(self.datafile, end)
2918 2227 end = rev * self._io.size
2919 2228 else:
2920 2229 end += rev * self._io.size
2921 2230
2922 2231 transaction.add(self.indexfile, end)
2923 2232
2924 2233 # then reset internal state in memory to forget those revisions
2925 2234 self._cache = None
2926 2235 self._chaininfocache = {}
2927 2236 self._chunkclear()
2928 2237 for x in pycompat.xrange(rev, len(self)):
2929 2238 del self.nodemap[self.node(x)]
2930 2239
2931 2240 del self.index[rev:-1]
2932 2241 self._nodepos = None
2933 2242
2934 2243 def checksize(self):
2935 2244 expected = 0
2936 2245 if len(self):
2937 2246 expected = max(0, self.end(len(self) - 1))
2938 2247
2939 2248 try:
2940 2249 with self._datafp() as f:
2941 2250 f.seek(0, 2)
2942 2251 actual = f.tell()
2943 2252 dd = actual - expected
2944 2253 except IOError as inst:
2945 2254 if inst.errno != errno.ENOENT:
2946 2255 raise
2947 2256 dd = 0
2948 2257
2949 2258 try:
2950 2259 f = self.opener(self.indexfile)
2951 2260 f.seek(0, 2)
2952 2261 actual = f.tell()
2953 2262 f.close()
2954 2263 s = self._io.size
2955 2264 i = max(0, actual // s)
2956 2265 di = actual - (i * s)
2957 2266 if self._inline:
2958 2267 databytes = 0
2959 2268 for r in self:
2960 2269 databytes += max(0, self.length(r))
2961 2270 dd = 0
2962 2271 di = actual - len(self) * s - databytes
2963 2272 except IOError as inst:
2964 2273 if inst.errno != errno.ENOENT:
2965 2274 raise
2966 2275 di = 0
2967 2276
2968 2277 return (dd, di)
2969 2278
2970 2279 def files(self):
2971 2280 res = [self.indexfile]
2972 2281 if not self._inline:
2973 2282 res.append(self.datafile)
2974 2283 return res
2975 2284
2976 2285 def emitrevisiondeltas(self, requests):
2977 2286 frev = self.rev
2978 2287
2979 2288 prevrev = None
2980 2289 for request in requests:
2981 2290 node = request.node
2982 2291 rev = frev(node)
2983 2292
2984 2293 if prevrev is None:
2985 2294 prevrev = self.index[rev][5]
2986 2295
2987 2296 # Requesting a full revision.
2988 2297 if request.basenode == nullid:
2989 2298 baserev = nullrev
2990 2299 # Requesting an explicit revision.
2991 2300 elif request.basenode is not None:
2992 2301 baserev = frev(request.basenode)
2993 2302 # Allowing us to choose.
2994 2303 else:
2995 2304 p1rev, p2rev = self.parentrevs(rev)
2996 2305 deltaparentrev = self.deltaparent(rev)
2997 2306
2998 2307 # Avoid sending full revisions when delta parent is null. Pick
2999 2308 # prev in that case. It's tempting to pick p1 in this case, as
3000 2309 # p1 will be smaller in the common case. However, computing a
3001 2310 # delta against p1 may require resolving the raw text of p1,
3002 2311 # which could be expensive. The revlog caches should have prev
3003 2312 # cached, meaning less CPU for delta generation. There is
3004 2313 # likely room to add a flag and/or config option to control this
3005 2314 # behavior.
3006 2315 if deltaparentrev == nullrev and self._storedeltachains:
3007 2316 baserev = prevrev
3008 2317
3009 2318 # Revlog is configured to use full snapshot for a reason.
3010 2319 # Stick to full snapshot.
3011 2320 elif deltaparentrev == nullrev:
3012 2321 baserev = nullrev
3013 2322
3014 2323 # Pick previous when we can't be sure the base is available
3015 2324 # on consumer.
3016 2325 elif deltaparentrev not in (p1rev, p2rev, prevrev):
3017 2326 baserev = prevrev
3018 2327 else:
3019 2328 baserev = deltaparentrev
3020 2329
3021 2330 if baserev != nullrev and not self.candelta(baserev, rev):
3022 2331 baserev = nullrev
3023 2332
3024 2333 revision = None
3025 2334 delta = None
3026 2335 baserevisionsize = None
3027 2336
3028 2337 if self.iscensored(baserev) or self.iscensored(rev):
3029 2338 try:
3030 2339 revision = self.revision(node, raw=True)
3031 2340 except error.CensoredNodeError as e:
3032 2341 revision = e.tombstone
3033 2342
3034 2343 if baserev != nullrev:
3035 2344 baserevisionsize = self.rawsize(baserev)
3036 2345
3037 2346 elif baserev == nullrev:
3038 2347 revision = self.revision(node, raw=True)
3039 2348 else:
3040 2349 delta = self.revdiff(baserev, rev)
3041 2350
3042 2351 extraflags = REVIDX_ELLIPSIS if request.ellipsis else 0
3043 2352
3044 2353 yield revlogrevisiondelta(
3045 2354 node=node,
3046 2355 p1node=request.p1node,
3047 2356 p2node=request.p2node,
3048 2357 linknode=request.linknode,
3049 2358 basenode=self.node(baserev),
3050 2359 flags=self.flags(rev) | extraflags,
3051 2360 baserevisionsize=baserevisionsize,
3052 2361 revision=revision,
3053 2362 delta=delta)
3054 2363
3055 2364 prevrev = rev
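
A hedged consumer sketch; the request objects and the consume_* helpers are hypothetical, only the attributes read above (node, basenode, p1node, p2node, linknode, ellipsis) are assumed:

    for rd in rl.emitrevisiondeltas(requests):
        if rd.delta is not None:
            consume_delta(rd.basenode, rd.delta)   # apply delta on top of basenode
        else:
            consume_fulltext(rd.revision)          # full (possibly censored) text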
3056 2365
3057 2366 DELTAREUSEALWAYS = 'always'
3058 2367 DELTAREUSESAMEREVS = 'samerevs'
3059 2368 DELTAREUSENEVER = 'never'
3060 2369
3061 2370 DELTAREUSEFULLADD = 'fulladd'
3062 2371
3063 2372 DELTAREUSEALL = {'always', 'samerevs', 'never', 'fulladd'}
3064 2373
3065 2374 def clone(self, tr, destrevlog, addrevisioncb=None,
3066 2375 deltareuse=DELTAREUSESAMEREVS, deltabothparents=None):
3067 2376 """Copy this revlog to another, possibly with format changes.
3068 2377
3069 2378 The destination revlog will contain the same revisions and nodes.
3070 2379 However, it may not be bit-for-bit identical due to e.g. delta encoding
3071 2380 differences.
3072 2381
3073 2382 The ``deltareuse`` argument controls how deltas from the existing revlog
3074 2383 are preserved in the destination revlog. The argument can have the
3075 2384 following values:
3076 2385
3077 2386 DELTAREUSEALWAYS
3078 2387 Deltas will always be reused (if possible), even if the destination
3079 2388 revlog would not select the same revisions for the delta. This is the
3080 2389 fastest mode of operation.
3081 2390 DELTAREUSESAMEREVS
3082 2391 Deltas will be reused if the destination revlog would pick the same
3083 2392 revisions for the delta. This mode strikes a balance between speed
3084 2393 and optimization.
3085 2394 DELTAREUSENEVER
3086 2395 Deltas will never be reused. This is the slowest mode of execution.
3087 2396 This mode can be used to recompute deltas (e.g. if the diff/delta
3088 2397 algorithm changes).
3089 2398
3090 2399 Delta computation can be slow, so the choice of delta reuse policy can
3091 2400 significantly affect run time.
3092 2401
3093 2402 The default policy (``DELTAREUSESAMEREVS``) strikes a balance between
3094 2403 two extremes. Deltas will be reused if they are appropriate. But if the
3095 2404 delta could choose a better revision, it will do so. This means if you
3096 2405 are converting a non-generaldelta revlog to a generaldelta revlog,
3097 2406 deltas will be recomputed if the delta's parent isn't a parent of the
3098 2407 revision.
3099 2408
3100 2409 In addition to the delta policy, the ``deltabothparents`` argument
3101 2410 controls whether to compute deltas against both parents for merges.
3102 2411 If ``None``, the destination revlog's current setting is kept.
3103 2412 """
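
For example, a minimal sketch of copying into an empty destination revlog (`src`, `dst` and `tr` are assumed to exist):

    # slow, but recomputes every delta with the destination's settings
    src.clone(tr, dst, deltareuse=src.DELTAREUSENEVER, deltabothparents=True)
    # alternatively, reuse existing deltas wherever possible (fastest):
    # src.clone(tr, dst, deltareuse=src.DELTAREUSEALWAYS)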
3104 2413 if deltareuse not in self.DELTAREUSEALL:
3105 2414 raise ValueError(_('value for deltareuse invalid: %s') % deltareuse)
3106 2415
3107 2416 if len(destrevlog):
3108 2417 raise ValueError(_('destination revlog is not empty'))
3109 2418
3110 2419 if getattr(self, 'filteredrevs', None):
3111 2420 raise ValueError(_('source revlog has filtered revisions'))
3112 2421 if getattr(destrevlog, 'filteredrevs', None):
3113 2422 raise ValueError(_('destination revlog has filtered revisions'))
3114 2423
3115 2424 # lazydeltabase controls whether to reuse a cached delta, if possible.
3116 2425 oldlazydeltabase = destrevlog._lazydeltabase
3117 2426 oldamd = destrevlog._deltabothparents
3118 2427
3119 2428 try:
3120 2429 if deltareuse == self.DELTAREUSEALWAYS:
3121 2430 destrevlog._lazydeltabase = True
3122 2431 elif deltareuse == self.DELTAREUSESAMEREVS:
3123 2432 destrevlog._lazydeltabase = False
3124 2433
3125 2434 destrevlog._deltabothparents = deltabothparents or oldamd
3126 2435
3127 2436 populatecachedelta = deltareuse in (self.DELTAREUSEALWAYS,
3128 2437 self.DELTAREUSESAMEREVS)
3129 2438
3130 deltacomputer = _deltacomputer(destrevlog)
2439 deltacomputer = deltautil.deltacomputer(destrevlog)
3131 2440 index = self.index
3132 2441 for rev in self:
3133 2442 entry = index[rev]
3134 2443
3135 2444 # Some classes override linkrev to take filtered revs into
3136 2445 # account. Use raw entry from index.
3137 2446 flags = entry[0] & 0xffff
3138 2447 linkrev = entry[4]
3139 2448 p1 = index[entry[5]][7]
3140 2449 p2 = index[entry[6]][7]
3141 2450 node = entry[7]
3142 2451
3143 2452 # (Possibly) reuse the delta from the revlog if allowed and
3144 2453 # the revlog chunk is a delta.
3145 2454 cachedelta = None
3146 2455 rawtext = None
3147 2456 if populatecachedelta:
3148 2457 dp = self.deltaparent(rev)
3149 2458 if dp != nullrev:
3150 2459 cachedelta = (dp, bytes(self._chunk(rev)))
3151 2460
3152 2461 if not cachedelta:
3153 2462 rawtext = self.revision(rev, raw=True)
3154 2463
3155 2464
3156 2465 if deltareuse == self.DELTAREUSEFULLADD:
3157 2466 destrevlog.addrevision(rawtext, tr, linkrev, p1, p2,
3158 2467 cachedelta=cachedelta,
3159 2468 node=node, flags=flags,
3160 2469 deltacomputer=deltacomputer)
3161 2470 else:
3162 2471 ifh = destrevlog.opener(destrevlog.indexfile, 'a+',
3163 2472 checkambig=False)
3164 2473 dfh = None
3165 2474 if not destrevlog._inline:
3166 2475 dfh = destrevlog.opener(destrevlog.datafile, 'a+')
3167 2476 try:
3168 2477 destrevlog._addrevision(node, rawtext, tr, linkrev, p1,
3169 2478 p2, flags, cachedelta, ifh, dfh,
3170 2479 deltacomputer=deltacomputer)
3171 2480 finally:
3172 2481 if dfh:
3173 2482 dfh.close()
3174 2483 ifh.close()
3175 2484
3176 2485 if addrevisioncb:
3177 2486 addrevisioncb(self, rev, node)
3178 2487 finally:
3179 2488 destrevlog._lazydeltabase = oldlazydeltabase
3180 2489 destrevlog._deltabothparents = oldamd
@@ -1,46 +1,43 b''
1 1 # revlogdeltas.py - constant used for revlog logic
2 2 #
3 3 # Copyright 2005-2007 Matt Mackall <mpm@selenic.com>
4 4 # Copyright 2018 Octobus <contact@octobus.net>
5 5 #
6 6 # This software may be used and distributed according to the terms of the
7 7 # GNU General Public License version 2 or any later version.
8 8 """Helper class to compute deltas stored inside revlogs"""
9 9
10 10 from __future__ import absolute_import
11 11
12 12 from .. import (
13 13 util,
14 14 )
15 15
16 16 # revlog header flags
17 17 REVLOGV0 = 0
18 18 REVLOGV1 = 1
19 19 # Dummy value until file format is finalized.
20 20 # Reminder: change the bounds check in revlog.__init__ when this is changed.
21 21 REVLOGV2 = 0xDEAD
22 22 FLAG_INLINE_DATA = (1 << 16)
23 23 FLAG_GENERALDELTA = (1 << 17)
24 24 REVLOG_DEFAULT_FLAGS = FLAG_INLINE_DATA
25 25 REVLOG_DEFAULT_FORMAT = REVLOGV1
26 26 REVLOG_DEFAULT_VERSION = REVLOG_DEFAULT_FORMAT | REVLOG_DEFAULT_FLAGS
27 27 REVLOGV1_FLAGS = FLAG_INLINE_DATA | FLAG_GENERALDELTA
28 28 REVLOGV2_FLAGS = REVLOGV1_FLAGS
29 29
30 30 # revlog index flags
31 31 REVIDX_ISCENSORED = (1 << 15) # revision has censor metadata, must be verified
32 32 REVIDX_ELLIPSIS = (1 << 14) # revision hash does not match data (narrowhg)
33 33 REVIDX_EXTSTORED = (1 << 13) # revision data is stored externally
34 34 REVIDX_DEFAULT_FLAGS = 0
35 35 # stable order in which flags need to be processed and their processors applied
36 36 REVIDX_FLAGS_ORDER = [
37 37 REVIDX_ISCENSORED,
38 38 REVIDX_ELLIPSIS,
39 39 REVIDX_EXTSTORED,
40 40 ]
41 41 REVIDX_KNOWN_FLAGS = util.bitsfrom(REVIDX_FLAGS_ORDER)
42 42 # bitmark for flags that could cause rawdata content change
43 43 REVIDX_RAWTEXT_CHANGING_FLAGS = REVIDX_ISCENSORED | REVIDX_EXTSTORED
44
45 # maximum <delta-chain-data>/<revision-text-length> ratio
46 LIMIT_DELTA2TEXT = 2
@@ -1,3180 +1,734 b''
1 # revlog.py - storage back-end for mercurial
1 # revlogdeltas.py - Logic around delta computation for revlog
2 2 #
3 3 # Copyright 2005-2007 Matt Mackall <mpm@selenic.com>
4 # Copyright 2018 Octobus <contact@octobus.net>
4 5 #
5 6 # This software may be used and distributed according to the terms of the
6 7 # GNU General Public License version 2 or any later version.
7
8 """Storage back-end for Mercurial.
9
10 This provides efficient delta storage with O(1) retrieve and append
11 and O(changes) merge between branches.
12 """
8 """Helper class to compute deltas stored inside revlogs"""
13 9
14 10 from __future__ import absolute_import
15 11
16 import collections
17 import contextlib
18 import errno
19 import hashlib
20 12 import heapq
21 import os
22 import re
23 13 import struct
24 import zlib
25 14
26 15 # import stuff from node for others to import from revlog
27 from .node import (
28 bin,
29 hex,
30 nullhex,
31 nullid,
16 from ..node import (
32 17 nullrev,
33 wdirfilenodeids,
34 wdirhex,
35 wdirid,
36 wdirrev,
37 18 )
38 from .i18n import _
39 from .revlogutils.constants import (
40 FLAG_GENERALDELTA,
41 FLAG_INLINE_DATA,
42 LIMIT_DELTA2TEXT,
43 REVIDX_DEFAULT_FLAGS,
44 REVIDX_ELLIPSIS,
45 REVIDX_EXTSTORED,
46 REVIDX_FLAGS_ORDER,
19 from ..i18n import _
20
21 from .constants import (
47 22 REVIDX_ISCENSORED,
48 REVIDX_KNOWN_FLAGS,
49 23 REVIDX_RAWTEXT_CHANGING_FLAGS,
50 REVLOGV0,
51 REVLOGV1,
52 REVLOGV1_FLAGS,
53 REVLOGV2,
54 REVLOGV2_FLAGS,
55 REVLOG_DEFAULT_FLAGS,
56 REVLOG_DEFAULT_FORMAT,
57 REVLOG_DEFAULT_VERSION,
58 24 )
59 from .thirdparty import (
25
26 from ..thirdparty import (
60 27 attr,
61 28 )
62 from . import (
63 ancestor,
29
30 from .. import (
64 31 error,
65 32 mdiff,
66 policy,
67 pycompat,
68 repository,
69 templatefilters,
70 util,
71 33 )
72 from .utils import (
73 interfaceutil,
74 stringutil,
75 )
76
77 # blanked usage of all the name to prevent pyflakes constraints
78 # We need these name available in the module for extensions.
79 REVLOGV0
80 REVLOGV1
81 REVLOGV2
82 FLAG_INLINE_DATA
83 FLAG_GENERALDELTA
84 REVLOG_DEFAULT_FLAGS
85 REVLOG_DEFAULT_FORMAT
86 REVLOG_DEFAULT_VERSION
87 REVLOGV1_FLAGS
88 REVLOGV2_FLAGS
89 REVIDX_ISCENSORED
90 REVIDX_ELLIPSIS
91 REVIDX_EXTSTORED
92 REVIDX_DEFAULT_FLAGS
93 REVIDX_FLAGS_ORDER
94 REVIDX_KNOWN_FLAGS
95 REVIDX_RAWTEXT_CHANGING_FLAGS
96
97 parsers = policy.importmod(r'parsers')
98
99 # Aliased for performance.
100 _zlibdecompress = zlib.decompress
101
102 # max size of revlog with inline data
103 _maxinline = 131072
104 _chunksize = 1048576
105 34
106 35 RevlogError = error.RevlogError
107 LookupError = error.LookupError
108 AmbiguousPrefixLookupError = error.AmbiguousPrefixLookupError
109 36 CensoredNodeError = error.CensoredNodeError
110 ProgrammingError = error.ProgrammingError
111
112 # Store flag processors (cf. 'addflagprocessor()' to register)
113 _flagprocessors = {
114 REVIDX_ISCENSORED: None,
115 }
116
117 _mdre = re.compile('\1\n')
118 def parsemeta(text):
119 """return (metadatadict, metadatasize)"""
120 # text can be buffer, so we can't use .startswith or .index
121 if text[:2] != '\1\n':
122 return None, None
123 s = _mdre.search(text, 2).start()
124 mtext = text[2:s]
125 meta = {}
126 for l in mtext.splitlines():
127 k, v = l.split(": ", 1)
128 meta[k] = v
129 return meta, (s + 2)
130
131 def packmeta(meta, text):
132 keys = sorted(meta)
133 metatext = "".join("%s: %s\n" % (k, meta[k]) for k in keys)
134 return "\1\n%s\1\n%s" % (metatext, text)
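
An illustrative round trip through these helpers (values are made up); the censored-revision prefix checked elsewhere in this file is just such a metadata block carrying a "censored" key:

    meta = {'copy': 'foo.txt', 'copyrev': '0' * 40}
    raw = packmeta(meta, 'file content\n')
    parsed, size = parsemeta(raw)
    assert parsed == meta and raw[size:] == 'file content\n'
    # a censored tombstone starts with "\1\ncensored:", which is what
    # _censoredtext() and _peek_iscensored() rely on
    assert packmeta({'censored': 'reason'}, '').startswith('\1\ncensored:')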
135
136 def _censoredtext(text):
137 m, offs = parsemeta(text)
138 return m and "censored" in m
139
140 def addflagprocessor(flag, processor):
141 """Register a flag processor on a revision data flag.
142 37
143 Invariant:
144 - Flags need to be defined in REVIDX_KNOWN_FLAGS and REVIDX_FLAGS_ORDER,
145 and REVIDX_RAWTEXT_CHANGING_FLAGS if they can alter rawtext.
146 - Only one flag processor can be registered on a specific flag.
147 - flagprocessors must be 3-tuples of functions (read, write, raw) with the
148 following signatures:
149 - (read) f(self, rawtext) -> text, bool
150 - (write) f(self, text) -> rawtext, bool
151 - (raw) f(self, rawtext) -> bool
152 "text" is presented to the user. "rawtext" is stored in revlog data, not
153 directly visible to the user.
154 The boolean returned by these transforms is used to determine whether
155 the returned text can be used for hash integrity checking. For example,
156 if "write" returns False, then "text" is used to generate hash. If
157 "write" returns True, that basically means "rawtext" returned by "write"
158 should be used to generate hash. Usually, "write" and "read" return
159 different booleans. And "raw" returns the same boolean as "write".
160
161 Note: The 'raw' transform is used for changegroup generation and in some
162 debug commands. In this case the transform only indicates whether the
163 contents can be used for hash integrity checks.
164 """
165 if not flag & REVIDX_KNOWN_FLAGS:
166 msg = _("cannot register processor on unknown flag '%#x'.") % (flag)
167 raise ProgrammingError(msg)
168 if flag not in REVIDX_FLAGS_ORDER:
169 msg = _("flag '%#x' undefined in REVIDX_FLAGS_ORDER.") % (flag)
170 raise ProgrammingError(msg)
171 if flag in _flagprocessors:
172 msg = _("cannot register multiple processors on flag '%#x'.") % (flag)
173 raise error.Abort(msg)
174 _flagprocessors[flag] = processor
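
A registration sketch; REVIDX_EXTSTORED is used purely as an example flag and the no-op transforms are hypothetical:

    def _readext(self, rawtext):
        return rawtext, True    # returned text may be used for hash checking
    def _writeext(self, text):
        return text, False      # hash is computed from "text", not "rawtext"
    def _rawext(self, rawtext):
        return False            # same boolean as "write"
    addflagprocessor(REVIDX_EXTSTORED, (_readext, _writeext, _rawext))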
175
176 def getoffset(q):
177 return int(q >> 16)
178
179 def gettype(q):
180 return int(q & 0xFFFF)
181
182 def offset_type(offset, type):
183 if (type & ~REVIDX_KNOWN_FLAGS) != 0:
184 raise ValueError('unknown revlog index flags')
185 return int(int(offset) << 16 | type)
186
187 _nullhash = hashlib.sha1(nullid)
188
189 def hash(text, p1, p2):
190 """generate a hash from the given text and its parent hashes
191
192 This hash combines both the current file contents and its history
193 in a manner that makes it easy to distinguish nodes with the same
194 content in the revision graph.
195 """
196 # As of now, if one of the parent node is null, p2 is null
197 if p2 == nullid:
198 # deep copy of a hash is faster than creating one
199 s = _nullhash.copy()
200 s.update(p1)
201 else:
202 # none of the parent nodes are nullid
203 if p1 < p2:
204 a = p1
205 b = p2
206 else:
207 a = p2
208 b = p1
209 s = hashlib.sha1(a)
210 s.update(b)
211 s.update(text)
212 return s.digest()
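
One consequence worth illustrating: because the two non-null parents are sorted before hashing, the resulting node id does not depend on the order in which they are passed (`pa` and `pb` stand for arbitrary non-null 20-byte parent ids):

    # parent order is irrelevant for non-null parents
    assert hash('some text', pa, pb) == hash('some text', pb, pa)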
38 # maximum <delta-chain-data>/<revision-text-length> ratio
39 LIMIT_DELTA2TEXT = 2
213 40
214 41 class _testrevlog(object):
215 42 """minimalist fake revlog to use in doctests"""
216 43
217 44 def __init__(self, data, density=0.5, mingap=0):
218 45 """data is an list of revision payload boundaries"""
219 46 self._data = data
220 47 self._srdensitythreshold = density
221 48 self._srmingapsize = mingap
222 49
223 50 def start(self, rev):
224 51 if rev == 0:
225 52 return 0
226 53 return self._data[rev - 1]
227 54
228 55 def end(self, rev):
229 56 return self._data[rev]
230 57
231 58 def length(self, rev):
232 59 return self.end(rev) - self.start(rev)
233 60
234 61 def __len__(self):
235 62 return len(self._data)
236 63
237 def _trimchunk(revlog, revs, startidx, endidx=None):
238 """returns revs[startidx:endidx] without empty trailing revs
239
240 Doctest Setup
241 >>> revlog = _testrevlog([
242 ... 5, #0
243 ... 10, #1
244 ... 12, #2
245 ... 12, #3 (empty)
246 ... 17, #4
247 ... 21, #5
248 ... 21, #6 (empty)
249 ... ])
250
251 Contiguous cases:
252 >>> _trimchunk(revlog, [0, 1, 2, 3, 4, 5, 6], 0)
253 [0, 1, 2, 3, 4, 5]
254 >>> _trimchunk(revlog, [0, 1, 2, 3, 4, 5, 6], 0, 5)
255 [0, 1, 2, 3, 4]
256 >>> _trimchunk(revlog, [0, 1, 2, 3, 4, 5, 6], 0, 4)
257 [0, 1, 2]
258 >>> _trimchunk(revlog, [0, 1, 2, 3, 4, 5, 6], 2, 4)
259 [2]
260 >>> _trimchunk(revlog, [0, 1, 2, 3, 4, 5, 6], 3)
261 [3, 4, 5]
262 >>> _trimchunk(revlog, [0, 1, 2, 3, 4, 5, 6], 3, 5)
263 [3, 4]
264
265 Discontiguous cases:
266 >>> _trimchunk(revlog, [1, 3, 5, 6], 0)
267 [1, 3, 5]
268 >>> _trimchunk(revlog, [1, 3, 5, 6], 0, 2)
269 [1]
270 >>> _trimchunk(revlog, [1, 3, 5, 6], 1, 3)
271 [3, 5]
272 >>> _trimchunk(revlog, [1, 3, 5, 6], 1)
273 [3, 5]
274 """
275 length = revlog.length
276
277 if endidx is None:
278 endidx = len(revs)
279
280 # If we have a non-empty delta candidate, there is nothing to trim
281 if revs[endidx - 1] < len(revlog):
282 # Trim empty revs at the end, except the very first revision of a chain
283 while (endidx > 1
284 and endidx > startidx
285 and length(revs[endidx - 1]) == 0):
286 endidx -= 1
287
288 return revs[startidx:endidx]
289
290 def _segmentspan(revlog, revs, deltainfo=None):
291 """Get the byte span of a segment of revisions
292
293 revs is a sorted array of revision numbers
294
295 >>> revlog = _testrevlog([
296 ... 5, #0
297 ... 10, #1
298 ... 12, #2
299 ... 12, #3 (empty)
300 ... 17, #4
301 ... ])
302
303 >>> _segmentspan(revlog, [0, 1, 2, 3, 4])
304 17
305 >>> _segmentspan(revlog, [0, 4])
306 17
307 >>> _segmentspan(revlog, [3, 4])
308 5
309 >>> _segmentspan(revlog, [1, 2, 3,])
310 7
311 >>> _segmentspan(revlog, [1, 3])
312 7
313 """
314 if not revs:
315 return 0
316 if deltainfo is not None and len(revlog) <= revs[-1]:
317 if len(revs) == 1:
318 return deltainfo.deltalen
319 offset = revlog.end(len(revlog) - 1)
320 end = deltainfo.deltalen + offset
321 else:
322 end = revlog.end(revs[-1])
323 return end - revlog.start(revs[0])
324
325 def _slicechunk(revlog, revs, deltainfo=None, targetsize=None):
64 def slicechunk(revlog, revs, deltainfo=None, targetsize=None):
326 65 """slice revs to reduce the amount of unrelated data to be read from disk.
327 66
328 67 ``revs`` is sliced into groups that should be read in one time.
329 68 Assume that revs are sorted.
330 69
331 70 The initial chunk is sliced until the overall density (payload/chunks-span
332 71 ratio) is above `revlog._srdensitythreshold`. No gap smaller than
333 72 `revlog._srmingapsize` is skipped.
334 73
335 74 If `targetsize` is set, no chunk larger than `targetsize` will be yielded.
336 75 For consistency with other slicing choices, this limit won't go lower than
337 76 `revlog._srmingapsize`.
338 77
339 78 If individual revision chunks are larger than this limit, they will still
340 79 be yielded individually.
341 80
342 81 >>> revlog = _testrevlog([
343 82 ... 5, #00 (5)
344 83 ... 10, #01 (5)
345 84 ... 12, #02 (2)
346 85 ... 12, #03 (empty)
347 86 ... 27, #04 (15)
348 87 ... 31, #05 (4)
349 88 ... 31, #06 (empty)
350 89 ... 42, #07 (11)
351 90 ... 47, #08 (5)
352 91 ... 47, #09 (empty)
353 92 ... 48, #10 (1)
354 93 ... 51, #11 (3)
355 94 ... 74, #12 (23)
356 95 ... 85, #13 (11)
357 96 ... 86, #14 (1)
358 97 ... 91, #15 (5)
359 98 ... ])
360 99
361 >>> list(_slicechunk(revlog, list(range(16))))
100 >>> list(slicechunk(revlog, list(range(16))))
362 101 [[0, 1, 2, 3, 4, 5, 6, 7, 8, 9, 10, 11, 12, 13, 14, 15]]
363 >>> list(_slicechunk(revlog, [0, 15]))
102 >>> list(slicechunk(revlog, [0, 15]))
364 103 [[0], [15]]
365 >>> list(_slicechunk(revlog, [0, 11, 15]))
104 >>> list(slicechunk(revlog, [0, 11, 15]))
366 105 [[0], [11], [15]]
367 >>> list(_slicechunk(revlog, [0, 11, 13, 15]))
106 >>> list(slicechunk(revlog, [0, 11, 13, 15]))
368 107 [[0], [11, 13, 15]]
369 >>> list(_slicechunk(revlog, [1, 2, 3, 5, 8, 10, 11, 14]))
108 >>> list(slicechunk(revlog, [1, 2, 3, 5, 8, 10, 11, 14]))
370 109 [[1, 2], [5, 8, 10, 11], [14]]
371 110
372 111 Slicing with a maximum chunk size
373 >>> list(_slicechunk(revlog, [0, 11, 13, 15], targetsize=15))
112 >>> list(slicechunk(revlog, [0, 11, 13, 15], targetsize=15))
374 113 [[0], [11], [13], [15]]
375 >>> list(_slicechunk(revlog, [0, 11, 13, 15], targetsize=20))
114 >>> list(slicechunk(revlog, [0, 11, 13, 15], targetsize=20))
376 115 [[0], [11], [13, 15]]
377 116 """
378 117 if targetsize is not None:
379 118 targetsize = max(targetsize, revlog._srmingapsize)
380 119 # targetsize should not be specified when evaluating delta candidates:
381 120 # * targetsize is used to ensure we stay within specification when reading,
382 121 # * deltainfo is used to pick a good delta chain when writing.
383 122 if not (deltainfo is None or targetsize is None):
384 123 msg = 'cannot use `targetsize` with a `deltainfo`'
385 124 raise error.ProgrammingError(msg)
386 125 for chunk in _slicechunktodensity(revlog, revs,
387 126 deltainfo,
388 127 revlog._srdensitythreshold,
389 128 revlog._srmingapsize):
390 129 for subchunk in _slicechunktosize(revlog, chunk, targetsize):
391 130 yield subchunk
392 131
393 132 def _slicechunktosize(revlog, revs, targetsize=None):
394 133 """slice revs to match the target size
395 134
396 135 This is intended to be used on chunk that density slicing selected by that
397 136 are still too large compared to the read garantee of revlog. This might
398 137 happens when "minimal gap size" interrupted the slicing or when chain are
399 138 built in a way that create large blocks next to each other.
400 139
401 140 >>> revlog = _testrevlog([
402 141 ... 3, #0 (3)
403 142 ... 5, #1 (2)
404 143 ... 6, #2 (1)
405 144 ... 8, #3 (2)
406 145 ... 8, #4 (empty)
407 146 ... 11, #5 (3)
408 147 ... 12, #6 (1)
409 148 ... 13, #7 (1)
410 149 ... 14, #8 (1)
411 150 ... ])
412 151
413 152 Cases where chunk is already small enough
414 153 >>> list(_slicechunktosize(revlog, [0], 3))
415 154 [[0]]
416 155 >>> list(_slicechunktosize(revlog, [6, 7], 3))
417 156 [[6, 7]]
418 157 >>> list(_slicechunktosize(revlog, [0], None))
419 158 [[0]]
420 159 >>> list(_slicechunktosize(revlog, [6, 7], None))
421 160 [[6, 7]]
422 161
423 162 cases where we need actual slicing
424 163 >>> list(_slicechunktosize(revlog, [0, 1], 3))
425 164 [[0], [1]]
426 165 >>> list(_slicechunktosize(revlog, [1, 3], 3))
427 166 [[1], [3]]
428 167 >>> list(_slicechunktosize(revlog, [1, 2, 3], 3))
429 168 [[1, 2], [3]]
430 169 >>> list(_slicechunktosize(revlog, [3, 5], 3))
431 170 [[3], [5]]
432 171 >>> list(_slicechunktosize(revlog, [3, 4, 5], 3))
433 172 [[3], [5]]
434 173 >>> list(_slicechunktosize(revlog, [5, 6, 7, 8], 3))
435 174 [[5], [6, 7, 8]]
436 175 >>> list(_slicechunktosize(revlog, [0, 1, 2, 3, 4, 5, 6, 7, 8], 3))
437 176 [[0], [1, 2], [3], [5], [6, 7, 8]]
438 177
439 178 Case with too large individual chunk (must return valid chunk)
440 179 >>> list(_slicechunktosize(revlog, [0, 1], 2))
441 180 [[0], [1]]
442 181 >>> list(_slicechunktosize(revlog, [1, 3], 1))
443 182 [[1], [3]]
444 183 >>> list(_slicechunktosize(revlog, [3, 4, 5], 2))
445 184 [[3], [5]]
446 185 """
447 186 assert targetsize is None or 0 <= targetsize
448 if targetsize is None or _segmentspan(revlog, revs) <= targetsize:
187 if targetsize is None or segmentspan(revlog, revs) <= targetsize:
449 188 yield revs
450 189 return
451 190
452 191 startrevidx = 0
453 192 startdata = revlog.start(revs[0])
454 193 endrevidx = 0
455 194 iterrevs = enumerate(revs)
456 195 next(iterrevs) # skip first rev.
457 196 for idx, r in iterrevs:
458 197 span = revlog.end(r) - startdata
459 198 if span <= targetsize:
460 199 endrevidx = idx
461 200 else:
462 201 chunk = _trimchunk(revlog, revs, startrevidx, endrevidx + 1)
463 202 if chunk:
464 203 yield chunk
465 204 startrevidx = idx
466 205 startdata = revlog.start(r)
467 206 endrevidx = idx
468 207 yield _trimchunk(revlog, revs, startrevidx)
469 208
470 209 def _slicechunktodensity(revlog, revs, deltainfo=None, targetdensity=0.5,
471 210 mingapsize=0):
472 211 """slice revs to reduce the amount of unrelated data to be read from disk.
473 212
474 213 ``revs`` is sliced into groups that should be read in one time.
475 214 Assume that revs are sorted.
476 215
477 216 ``deltainfo`` is a _deltainfo instance of a revision that we would append
478 217 to the top of the revlog.
479 218
480 219 The initial chunk is sliced until the overall density (payload/chunks-span
481 220 ratio) is above `targetdensity`. No gap smaller than `mingapsize` is
482 221 skipped.
483 222
484 223 >>> revlog = _testrevlog([
485 224 ... 5, #00 (5)
486 225 ... 10, #01 (5)
487 226 ... 12, #02 (2)
488 227 ... 12, #03 (empty)
489 228 ... 27, #04 (15)
490 229 ... 31, #05 (4)
491 230 ... 31, #06 (empty)
492 231 ... 42, #07 (11)
493 232 ... 47, #08 (5)
494 233 ... 47, #09 (empty)
495 234 ... 48, #10 (1)
496 235 ... 51, #11 (3)
497 236 ... 74, #12 (23)
498 237 ... 85, #13 (11)
499 238 ... 86, #14 (1)
500 239 ... 91, #15 (5)
501 240 ... ])
502 241
503 242 >>> list(_slicechunktodensity(revlog, list(range(16))))
504 243 [[0, 1, 2, 3, 4, 5, 6, 7, 8, 9, 10, 11, 12, 13, 14, 15]]
505 244 >>> list(_slicechunktodensity(revlog, [0, 15]))
506 245 [[0], [15]]
507 246 >>> list(_slicechunktodensity(revlog, [0, 11, 15]))
508 247 [[0], [11], [15]]
509 248 >>> list(_slicechunktodensity(revlog, [0, 11, 13, 15]))
510 249 [[0], [11, 13, 15]]
511 250 >>> list(_slicechunktodensity(revlog, [1, 2, 3, 5, 8, 10, 11, 14]))
512 251 [[1, 2], [5, 8, 10, 11], [14]]
513 252 >>> list(_slicechunktodensity(revlog, [1, 2, 3, 5, 8, 10, 11, 14],
514 253 ... mingapsize=20))
515 254 [[1, 2, 3, 5, 8, 10, 11], [14]]
516 255 >>> list(_slicechunktodensity(revlog, [1, 2, 3, 5, 8, 10, 11, 14],
517 256 ... targetdensity=0.95))
518 257 [[1, 2], [5], [8, 10, 11], [14]]
519 258 >>> list(_slicechunktodensity(revlog, [1, 2, 3, 5, 8, 10, 11, 14],
520 259 ... targetdensity=0.95, mingapsize=12))
521 260 [[1, 2], [5, 8, 10, 11], [14]]
522 261 """
523 262 start = revlog.start
524 263 length = revlog.length
525 264
526 265 if len(revs) <= 1:
527 266 yield revs
528 267 return
529 268
530 269 nextrev = len(revlog)
531 270 nextoffset = revlog.end(nextrev - 1)
532 271
533 272 if deltainfo is None:
534 deltachainspan = _segmentspan(revlog, revs)
273 deltachainspan = segmentspan(revlog, revs)
535 274 chainpayload = sum(length(r) for r in revs)
536 275 else:
537 276 deltachainspan = deltainfo.distance
538 277 chainpayload = deltainfo.compresseddeltalen
539 278
540 279 if deltachainspan < mingapsize:
541 280 yield revs
542 281 return
543 282
544 283 readdata = deltachainspan
545 284
546 285 if deltachainspan:
547 286 density = chainpayload / float(deltachainspan)
548 287 else:
549 288 density = 1.0
550 289
551 290 if density >= targetdensity:
552 291 yield revs
553 292 return
554 293
555 294 if deltainfo is not None and deltainfo.deltalen:
556 295 revs = list(revs)
557 296 revs.append(nextrev)
558 297
559 298 # Store the gaps in a heap to have them sorted by decreasing size
560 299 gapsheap = []
561 300 heapq.heapify(gapsheap)
562 301 prevend = None
563 302 for i, rev in enumerate(revs):
564 303 if rev < nextrev:
565 304 revstart = start(rev)
566 305 revlen = length(rev)
567 306 else:
568 307 revstart = nextoffset
569 308 revlen = deltainfo.deltalen
570 309
571 310 # Skip empty revisions to form larger holes
572 311 if revlen == 0:
573 312 continue
574 313
575 314 if prevend is not None:
576 315 gapsize = revstart - prevend
577 316 # only consider holes that are large enough
578 317 if gapsize > mingapsize:
579 318 heapq.heappush(gapsheap, (-gapsize, i))
580 319
581 320 prevend = revstart + revlen
582 321
583 322 # Collect the indices of the largest holes until the density is acceptable
584 323 indicesheap = []
585 324 heapq.heapify(indicesheap)
586 325 while gapsheap and density < targetdensity:
587 326 oppgapsize, gapidx = heapq.heappop(gapsheap)
588 327
589 328 heapq.heappush(indicesheap, gapidx)
590 329
591 330 # the gap sizes are stored as negatives to be sorted decreasingly
592 331 # by the heap
593 332 readdata -= (-oppgapsize)
594 333 if readdata > 0:
595 334 density = chainpayload / float(readdata)
596 335 else:
597 336 density = 1.0
598 337
599 338 # Cut the revs at collected indices
600 339 previdx = 0
601 340 while indicesheap:
602 341 idx = heapq.heappop(indicesheap)
603 342
604 343 chunk = _trimchunk(revlog, revs, previdx, idx)
605 344 if chunk:
606 345 yield chunk
607 346
608 347 previdx = idx
609 348
610 349 chunk = _trimchunk(revlog, revs, previdx)
611 350 if chunk:
612 351 yield chunk
613 352
353 def _trimchunk(revlog, revs, startidx, endidx=None):
354 """returns revs[startidx:endidx] without empty trailing revs
355
356 Doctest Setup
357 >>> revlog = _testrevlog([
358 ... 5, #0
359 ... 10, #1
360 ... 12, #2
361 ... 12, #3 (empty)
362 ... 17, #4
363 ... 21, #5
364 ... 21, #6 (empty)
365 ... ])
366
367 Contiguous cases:
368 >>> _trimchunk(revlog, [0, 1, 2, 3, 4, 5, 6], 0)
369 [0, 1, 2, 3, 4, 5]
370 >>> _trimchunk(revlog, [0, 1, 2, 3, 4, 5, 6], 0, 5)
371 [0, 1, 2, 3, 4]
372 >>> _trimchunk(revlog, [0, 1, 2, 3, 4, 5, 6], 0, 4)
373 [0, 1, 2]
374 >>> _trimchunk(revlog, [0, 1, 2, 3, 4, 5, 6], 2, 4)
375 [2]
376 >>> _trimchunk(revlog, [0, 1, 2, 3, 4, 5, 6], 3)
377 [3, 4, 5]
378 >>> _trimchunk(revlog, [0, 1, 2, 3, 4, 5, 6], 3, 5)
379 [3, 4]
380
381 Discontiguous cases:
382 >>> _trimchunk(revlog, [1, 3, 5, 6], 0)
383 [1, 3, 5]
384 >>> _trimchunk(revlog, [1, 3, 5, 6], 0, 2)
385 [1]
386 >>> _trimchunk(revlog, [1, 3, 5, 6], 1, 3)
387 [3, 5]
388 >>> _trimchunk(revlog, [1, 3, 5, 6], 1)
389 [3, 5]
390 """
391 length = revlog.length
392
393 if endidx is None:
394 endidx = len(revs)
395
396 # If we have a non-empty delta candidate, there is nothing to trim
397 if revs[endidx - 1] < len(revlog):
398 # Trim empty revs at the end, except the very first revision of a chain
399 while (endidx > 1
400 and endidx > startidx
401 and length(revs[endidx - 1]) == 0):
402 endidx -= 1
403
404 return revs[startidx:endidx]
405
406 def segmentspan(revlog, revs, deltainfo=None):
407 """Get the byte span of a segment of revisions
408
409 revs is a sorted array of revision numbers
410
411 >>> revlog = _testrevlog([
412 ... 5, #0
413 ... 10, #1
414 ... 12, #2
415 ... 12, #3 (empty)
416 ... 17, #4
417 ... ])
418
419 >>> segmentspan(revlog, [0, 1, 2, 3, 4])
420 17
421 >>> segmentspan(revlog, [0, 4])
422 17
423 >>> segmentspan(revlog, [3, 4])
424 5
425 >>> segmentspan(revlog, [1, 2, 3,])
426 7
427 >>> segmentspan(revlog, [1, 3])
428 7
429 """
430 if not revs:
431 return 0
432 if deltainfo is not None and len(revlog) <= revs[-1]:
433 if len(revs) == 1:
434 return deltainfo.deltalen
435 offset = revlog.end(len(revlog) - 1)
436 end = deltainfo.deltalen + offset
437 else:
438 end = revlog.end(revs[-1])
439 return end - revlog.start(revs[0])
440
614 441 @attr.s(slots=True, frozen=True)
615 442 class _deltainfo(object):
616 443 distance = attr.ib()
617 444 deltalen = attr.ib()
618 445 data = attr.ib()
619 446 base = attr.ib()
620 447 chainbase = attr.ib()
621 448 chainlen = attr.ib()
622 449 compresseddeltalen = attr.ib()
623 450 snapshotdepth = attr.ib()
624 451
625 class _deltacomputer(object):
452 def isgooddeltainfo(revlog, deltainfo, revinfo):
453 """Returns True if the given delta is good. Good means that it is within
454 the disk span, disk size, and chain length bounds that we know to be
455 performant."""
456 if deltainfo is None:
457 return False
458
459 # - 'deltainfo.distance' is the distance from the base revision --
460 # bounding it limits the amount of I/O we need to do.
461 # - 'deltainfo.compresseddeltalen' is the sum of the total size of
462 # deltas we need to apply -- bounding it limits the amount of CPU
463 # we consume.
464
465 if revlog._sparserevlog:
466 # As sparse-read will be used, we can consider that the distance,
467 # instead of being the span of the whole chunk,
468 # is the span of the largest read chunk
469 base = deltainfo.base
470
471 if base != nullrev:
472 deltachain = revlog._deltachain(base)[0]
473 else:
474 deltachain = []
475
476 # search for the first non-snapshot revision
477 for idx, r in enumerate(deltachain):
478 if not revlog.issnapshot(r):
479 break
480 deltachain = deltachain[idx:]
481 chunks = slicechunk(revlog, deltachain, deltainfo)
482 all_span = [segmentspan(revlog, revs, deltainfo)
483 for revs in chunks]
484 distance = max(all_span)
485 else:
486 distance = deltainfo.distance
487
488 textlen = revinfo.textlen
489 defaultmax = textlen * 4
490 maxdist = revlog._maxdeltachainspan
491 if not maxdist:
492 maxdist = distance # ensure the conditional passes
493 maxdist = max(maxdist, defaultmax)
494 if revlog._sparserevlog and maxdist < revlog._srmingapsize:
495 # In multiple places, we ignore irrelevant data ranges below a
496 # certain size. We also apply that tradeoff here and relax the span
497 # constraint for small enough content.
498 maxdist = revlog._srmingapsize
499
500 # Bad delta from read span:
501 #
502 # If the span of data read is larger than the maximum allowed.
503 if maxdist < distance:
504 return False
505
506 # Bad delta from new delta size:
507 #
508 # If the delta size is larger than the target text, storing the
509 # delta will be inefficient.
510 if textlen < deltainfo.deltalen:
511 return False
512
513 # Bad delta from cumulated payload size:
514 #
515 # If the sum of the deltas gets larger than K * the target text length.
516 if textlen * LIMIT_DELTA2TEXT < deltainfo.compresseddeltalen:
517 return False
518
519 # Bad delta from chain length:
520 #
521 # If the number of deltas in the chain gets too high.
522 if (revlog._maxchainlen
523 and revlog._maxchainlen < deltainfo.chainlen):
524 return False
525
526 # bad delta from intermediate snapshot size limit
527 #
528 # Reject the delta if an intermediate snapshot's size exceeds the limit.
529 # The limit exists to prevent endless chains of intermediate deltas from
530 # being created.
531 if (deltainfo.snapshotdepth is not None and
532 (textlen >> deltainfo.snapshotdepth) < deltainfo.deltalen):
533 return False
534
535 # bad delta if new intermediate snapshot is larger than the previous
536 # snapshot
537 if (deltainfo.snapshotdepth
538 and revlog.length(deltainfo.base) < deltainfo.deltalen):
539 return False
540
541 return True
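
Illustrative arithmetic for the two size bounds above, using a made-up 1000-byte revision text:

    textlen = 1000
    assert textlen * 4 == 4000                  # default read-span ceiling (defaultmax)
    assert textlen * LIMIT_DELTA2TEXT == 2000   # cumulated compressed-delta ceiling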
542
543 class deltacomputer(object):
626 544 def __init__(self, revlog):
627 545 self.revlog = revlog
628 546
629 547 def _getcandidaterevs(self, p1, p2, cachedelta):
630 548 """
631 549 Provides revisions that present an interest to be diffed against,
632 550 grouped by level of easiness.
633 551 """
634 552 revlog = self.revlog
635 553 gdelta = revlog._generaldelta
636 554 curr = len(revlog)
637 555 prev = curr - 1
638 556 p1r, p2r = revlog.rev(p1), revlog.rev(p2)
639 557
640 558 # should we try to build a delta?
641 559 if prev != nullrev and revlog._storedeltachains:
642 560 tested = set()
643 561 # This condition is true most of the time when processing
644 562 # changegroup data into a generaldelta repo. The only time it
645 563 # isn't true is if this is the first revision in a delta chain
646 564 # or if ``format.generaldelta=true`` disabled ``lazydeltabase``.
647 565 if cachedelta and gdelta and revlog._lazydeltabase:
648 566 # Assume what we received from the server is a good choice
649 567 # build delta will reuse the cache
650 568 yield (cachedelta[0],)
651 569 tested.add(cachedelta[0])
652 570
653 571 if gdelta:
654 572 # exclude already lazy tested base if any
655 573 parents = [p for p in (p1r, p2r)
656 574 if p != nullrev and p not in tested]
657 575
658 576 if not revlog._deltabothparents and len(parents) == 2:
659 577 parents.sort()
660 578 # To minimize the chance of having to build a fulltext,
661 579 # pick first whichever parent is closest to us (max rev)
662 580 yield (parents[1],)
663 581 # then the other one (min rev) if the first did not fit
664 582 yield (parents[0],)
665 583 tested.update(parents)
666 584 elif len(parents) > 0:
667 585 # Test all parents (1 or 2), and keep the best candidate
668 586 yield parents
669 587 tested.update(parents)
670 588
671 589 if prev not in tested:
672 590 # other approaches failed; try against prev to hopefully save us a
673 591 # fulltext.
674 592 yield (prev,)
675 593 tested.add(prev)
676 594
677 595 def buildtext(self, revinfo, fh):
678 596 """Builds a fulltext version of a revision
679 597
680 598 revinfo: _revisioninfo instance that contains all needed info
681 599 fh: file handle to either the .i or the .d revlog file,
682 600 depending on whether it is inlined or not
683 601 """
684 602 btext = revinfo.btext
685 603 if btext[0] is not None:
686 604 return btext[0]
687 605
688 606 revlog = self.revlog
689 607 cachedelta = revinfo.cachedelta
690 608 flags = revinfo.flags
691 609 node = revinfo.node
692 610
693 611 baserev = cachedelta[0]
694 612 delta = cachedelta[1]
695 613 # special case deltas which replace entire base; no need to decode
696 614 # base revision. this neatly avoids censored bases, which throw when
697 615 # they're decoded.
698 616 hlen = struct.calcsize(">lll")
699 617 if delta[:hlen] == mdiff.replacediffheader(revlog.rawsize(baserev),
700 618 len(delta) - hlen):
701 619 btext[0] = delta[hlen:]
702 620 else:
703 621 # deltabase is rawtext before changed by flag processors, which is
704 622 # equivalent to non-raw text
705 623 basetext = revlog.revision(baserev, _df=fh, raw=False)
706 624 btext[0] = mdiff.patch(basetext, delta)
707 625
708 626 try:
709 627 res = revlog._processflags(btext[0], flags, 'read', raw=True)
710 628 btext[0], validatehash = res
711 629 if validatehash:
712 630 revlog.checkhash(btext[0], node, p1=revinfo.p1, p2=revinfo.p2)
713 631 if flags & REVIDX_ISCENSORED:
714 632 raise RevlogError(_('node %s is not censored') % node)
715 633 except CensoredNodeError:
716 634 # must pass the censored index flag to add censored revisions
717 635 if not flags & REVIDX_ISCENSORED:
718 636 raise
719 637 return btext[0]
720 638
721 639 def _builddeltadiff(self, base, revinfo, fh):
722 640 revlog = self.revlog
723 641 t = self.buildtext(revinfo, fh)
724 642 if revlog.iscensored(base):
725 643 # deltas based on a censored revision must replace the
726 644 # full content in one patch, so delta works everywhere
727 645 header = mdiff.replacediffheader(revlog.rawsize(base), len(t))
728 646 delta = header + t
729 647 else:
730 648 ptext = revlog.revision(base, _df=fh, raw=True)
731 649 delta = mdiff.textdiff(ptext, t)
732 650
733 651 return delta
734 652
735 653 def _builddeltainfo(self, revinfo, base, fh):
736 654 # can we use the cached delta?
737 655 if revinfo.cachedelta and revinfo.cachedelta[0] == base:
738 656 delta = revinfo.cachedelta[1]
739 657 else:
740 658 delta = self._builddeltadiff(base, revinfo, fh)
741 659 revlog = self.revlog
742 660 header, data = revlog.compress(delta)
743 661 deltalen = len(header) + len(data)
744 662 chainbase = revlog.chainbase(base)
745 663 offset = revlog.end(len(revlog) - 1)
746 664 dist = deltalen + offset - revlog.start(chainbase)
747 665 if revlog._generaldelta:
748 666 deltabase = base
749 667 else:
750 668 deltabase = chainbase
751 669 chainlen, compresseddeltalen = revlog._chaininfo(base)
752 670 chainlen += 1
753 671 compresseddeltalen += deltalen
754 672
755 673 revlog = self.revlog
756 674 snapshotdepth = None
757 675 if deltabase == nullrev:
758 676 snapshotdepth = 0
759 677 elif revlog._sparserevlog and revlog.issnapshot(deltabase):
760 678 # A delta chain should always be one full snapshot,
761 679 # zero or more semi-snapshots, and zero or more deltas
762 680 p1, p2 = revlog.rev(revinfo.p1), revlog.rev(revinfo.p2)
763 681 if deltabase not in (p1, p2) and revlog.issnapshot(deltabase):
764 682 snapshotdepth = len(revlog._deltachain(deltabase)[0])
765 683
766 684 return _deltainfo(dist, deltalen, (header, data), deltabase,
767 685 chainbase, chainlen, compresseddeltalen,
768 686 snapshotdepth)
769 687
770 688 def finddeltainfo(self, revinfo, fh):
771 689 """Find an acceptable delta against a candidate revision
772 690
773 691 revinfo: information about the revision (instance of _revisioninfo)
774 692 fh: file handle to either the .i or the .d revlog file,
775 693 depending on whether it is inlined or not
776 694
777 695 Returns the first acceptable candidate revision, as ordered by
778 696 _getcandidaterevs
779 697 """
780 698 if not revinfo.textlen:
781 699 return None # empty files do not need a delta
782 700
783 701 cachedelta = revinfo.cachedelta
784 702 p1 = revinfo.p1
785 703 p2 = revinfo.p2
786 704 revlog = self.revlog
787 705
788 706 deltalength = self.revlog.length
789 707 deltaparent = self.revlog.deltaparent
790 708
791 709 deltainfo = None
792 710 deltas_limit = revinfo.textlen * LIMIT_DELTA2TEXT
793 711 for candidaterevs in self._getcandidaterevs(p1, p2, cachedelta):
794 712 # filter out delta bases that will never produce a good delta
795 713 candidaterevs = [r for r in candidaterevs
796 714 if self.revlog.length(r) <= deltas_limit]
797 715 nominateddeltas = []
798 716 for candidaterev in candidaterevs:
799 717 # skip over empty deltas (no need to include them in a chain)
800 718 while candidaterev != nullrev and not deltalength(candidaterev):
801 719 candidaterev = deltaparent(candidaterev)
802 720 # no need to try a delta against nullid, this will be handled
803 721 # by fulltext later.
804 722 if candidaterev == nullrev:
805 723 continue
806 724 # no delta for rawtext-changing revs (see "candelta" for why)
807 725 if revlog.flags(candidaterev) & REVIDX_RAWTEXT_CHANGING_FLAGS:
808 726 continue
809 727 candidatedelta = self._builddeltainfo(revinfo, candidaterev, fh)
810 if revlog._isgooddeltainfo(candidatedelta, revinfo):
728 if isgooddeltainfo(self.revlog, candidatedelta, revinfo):
811 729 nominateddeltas.append(candidatedelta)
812 730 if nominateddeltas:
813 731 deltainfo = min(nominateddeltas, key=lambda x: x.deltalen)
814 732 break
815 733
816 734 return deltainfo
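
A caller-side sketch of the new API (assuming `rl` is an open revlog and `revinfo` a _revisioninfo describing the revision being stored):

    dc = deltacomputer(rl)
    with rl._datareadfp() as fh:
        info = dc.finddeltainfo(revinfo, fh)
    if info is None:
        pass  # no acceptable delta: the revision is stored as a full snapshot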
817
818 @attr.s(slots=True, frozen=True)
819 class _revisioninfo(object):
820 """Information about a revision that allows building its fulltext
821 node: expected hash of the revision
822 p1, p2: parent revs of the revision
823 btext: built text cache consisting of a one-element list
824 cachedelta: (baserev, uncompressed_delta) or None
825 flags: flags associated to the revision storage
826
827 One of btext[0] or cachedelta must be set.
828 """
829 node = attr.ib()
830 p1 = attr.ib()
831 p2 = attr.ib()
832 btext = attr.ib()
833 textlen = attr.ib()
834 cachedelta = attr.ib()
835 flags = attr.ib()
836
837 @interfaceutil.implementer(repository.irevisiondelta)
838 @attr.s(slots=True, frozen=True)
839 class revlogrevisiondelta(object):
840 node = attr.ib()
841 p1node = attr.ib()
842 p2node = attr.ib()
843 basenode = attr.ib()
844 linknode = attr.ib()
845 flags = attr.ib()
846 baserevisionsize = attr.ib()
847 revision = attr.ib()
848 delta = attr.ib()
849
850 # index v0:
851 # 4 bytes: offset
852 # 4 bytes: compressed length
853 # 4 bytes: base rev
854 # 4 bytes: link rev
855 # 20 bytes: parent 1 nodeid
856 # 20 bytes: parent 2 nodeid
857 # 20 bytes: nodeid
858 indexformatv0 = struct.Struct(">4l20s20s20s")
859 indexformatv0_pack = indexformatv0.pack
860 indexformatv0_unpack = indexformatv0.unpack
861
862 class revlogoldindex(list):
863 def __getitem__(self, i):
864 if i == -1:
865 return (0, 0, 0, -1, -1, -1, -1, nullid)
866 return list.__getitem__(self, i)
867
868 class revlogoldio(object):
869 def __init__(self):
870 self.size = indexformatv0.size
871
872 def parseindex(self, data, inline):
873 s = self.size
874 index = []
875 nodemap = {nullid: nullrev}
876 n = off = 0
877 l = len(data)
878 while off + s <= l:
879 cur = data[off:off + s]
880 off += s
881 e = indexformatv0_unpack(cur)
882 # transform to revlogv1 format
883 e2 = (offset_type(e[0], 0), e[1], -1, e[2], e[3],
884 nodemap.get(e[4], nullrev), nodemap.get(e[5], nullrev), e[6])
885 index.append(e2)
886 nodemap[e[6]] = n
887 n += 1
888
889 return revlogoldindex(index), nodemap, None
890
891 def packentry(self, entry, node, version, rev):
892 if gettype(entry[0]):
893 raise RevlogError(_('index entry flags need revlog version 1'))
894 e2 = (getoffset(entry[0]), entry[1], entry[3], entry[4],
895 node(entry[5]), node(entry[6]), entry[7])
896 return indexformatv0_pack(*e2)
897
898 # index ng:
899 # 6 bytes: offset
900 # 2 bytes: flags
901 # 4 bytes: compressed length
902 # 4 bytes: uncompressed length
903 # 4 bytes: base rev
904 # 4 bytes: link rev
905 # 4 bytes: parent 1 rev
906 # 4 bytes: parent 2 rev
907 # 32 bytes: nodeid
908 indexformatng = struct.Struct(">Qiiiiii20s12x")
909 indexformatng_pack = indexformatng.pack
910 versionformat = struct.Struct(">I")
911 versionformat_pack = versionformat.pack
912 versionformat_unpack = versionformat.unpack
913
914 # corresponds to uncompressed length of indexformatng (2 gigs, 4-byte
915 # signed integer)
916 _maxentrysize = 0x7fffffff
917
918 class revlogio(object):
919 def __init__(self):
920 self.size = indexformatng.size
921
922 def parseindex(self, data, inline):
923 # call the C implementation to parse the index data
924 index, cache = parsers.parse_index2(data, inline)
925 return index, getattr(index, 'nodemap', None), cache
926
927 def packentry(self, entry, node, version, rev):
928 p = indexformatng_pack(*entry)
929 if rev == 0:
930 p = versionformat_pack(version) + p[4:]
931 return p
932
933 class revlog(object):
934 """
935 the underlying revision storage object
936
937 A revlog consists of two parts, an index and the revision data.
938
939 The index is a file with a fixed record size containing
940 information on each revision, including its nodeid (hash), the
941 nodeids of its parents, the position and offset of its data within
942 the data file, and the revision it's based on. Finally, each entry
943 contains a linkrev entry that can serve as a pointer to external
944 data.
945
946 The revision data itself is a linear collection of data chunks.
947 Each chunk represents a revision and is usually represented as a
948 delta against the previous chunk. To bound lookup time, runs of
949 deltas are limited to about 2 times the length of the original
950 version data. This makes retrieval of a version proportional to
951 its size, or O(1) relative to the number of revisions.
952
953 Both pieces of the revlog are written to in an append-only
954 fashion, which means we never need to rewrite a file to insert or
955 remove data, and can use some simple techniques to avoid the need
956 for locking while reading.
957
958 If checkambig, indexfile is opened with checkambig=True at
959 writing, to avoid file stat ambiguity.
960
961 If mmaplargeindex is True, and an mmapindexthreshold is set, the
962 index will be mmapped rather than read if it is larger than the
963 configured threshold.
964
965 If censorable is True, the revlog can have censored revisions.
966 """
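
A usage sketch, assuming `opener` is a Mercurial vfs (for example repo.svfs):

    rl = revlog(opener, 'data/foo.txt.i')   # datafile defaults to 'data/foo.txt.d'
    tipnode = rl.tip()
    text = rl.revision(tipnode)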
967 def __init__(self, opener, indexfile, datafile=None, checkambig=False,
968 mmaplargeindex=False, censorable=False):
969 """
970 create a revlog object
971
972 opener is a function that abstracts the file opening operation
973 and can be used to implement COW semantics or the like.
974 """
975 self.indexfile = indexfile
976 self.datafile = datafile or (indexfile[:-2] + ".d")
977 self.opener = opener
978 # When True, indexfile is opened with checkambig=True at writing, to
979 # avoid file stat ambiguity.
980 self._checkambig = checkambig
981 self._censorable = censorable
982 # 3-tuple of (node, rev, text) for a raw revision.
983 self._cache = None
984 # Maps rev to chain base rev.
985 self._chainbasecache = util.lrucachedict(100)
986 # 2-tuple of (offset, data) of raw data from the revlog at an offset.
987 self._chunkcache = (0, '')
988 # How much data to read and cache into the raw revlog data cache.
989 self._chunkcachesize = 65536
990 self._maxchainlen = None
991 self._deltabothparents = True
992 self.index = []
993 # Mapping of partial identifiers to full nodes.
994 self._pcache = {}
995 # Mapping of revision integer to full node.
996 self._nodecache = {nullid: nullrev}
997 self._nodepos = None
998 self._compengine = 'zlib'
999 self._maxdeltachainspan = -1
1000 self._withsparseread = False
1001 self._sparserevlog = False
1002 self._srdensitythreshold = 0.50
1003 self._srmingapsize = 262144
1004
1005 mmapindexthreshold = None
1006 v = REVLOG_DEFAULT_VERSION
1007 opts = getattr(opener, 'options', None)
1008 if opts is not None:
1009 if 'revlogv2' in opts:
1010 # version 2 revlogs always use generaldelta.
1011 v = REVLOGV2 | FLAG_GENERALDELTA | FLAG_INLINE_DATA
1012 elif 'revlogv1' in opts:
1013 if 'generaldelta' in opts:
1014 v |= FLAG_GENERALDELTA
1015 else:
1016 v = 0
1017 if 'chunkcachesize' in opts:
1018 self._chunkcachesize = opts['chunkcachesize']
1019 if 'maxchainlen' in opts:
1020 self._maxchainlen = opts['maxchainlen']
1021 if 'deltabothparents' in opts:
1022 self._deltabothparents = opts['deltabothparents']
1023 self._lazydeltabase = bool(opts.get('lazydeltabase', False))
1024 if 'compengine' in opts:
1025 self._compengine = opts['compengine']
1026 if 'maxdeltachainspan' in opts:
1027 self._maxdeltachainspan = opts['maxdeltachainspan']
1028 if mmaplargeindex and 'mmapindexthreshold' in opts:
1029 mmapindexthreshold = opts['mmapindexthreshold']
1030 self._sparserevlog = bool(opts.get('sparse-revlog', False))
1031 withsparseread = bool(opts.get('with-sparse-read', False))
1032 # sparse-revlog forces sparse-read
1033 self._withsparseread = self._sparserevlog or withsparseread
1034 if 'sparse-read-density-threshold' in opts:
1035 self._srdensitythreshold = opts['sparse-read-density-threshold']
1036 if 'sparse-read-min-gap-size' in opts:
1037 self._srmingapsize = opts['sparse-read-min-gap-size']
1038
1039 if self._chunkcachesize <= 0:
1040 raise RevlogError(_('revlog chunk cache size %r is not greater '
1041 'than 0') % self._chunkcachesize)
1042 elif self._chunkcachesize & (self._chunkcachesize - 1):
1043 raise RevlogError(_('revlog chunk cache size %r is not a power '
1044 'of 2') % self._chunkcachesize)
1045
1046 indexdata = ''
1047 self._initempty = True
1048 try:
1049 with self._indexfp() as f:
1050 if (mmapindexthreshold is not None and
1051 self.opener.fstat(f).st_size >= mmapindexthreshold):
1052 indexdata = util.buffer(util.mmapread(f))
1053 else:
1054 indexdata = f.read()
1055 if len(indexdata) > 0:
1056 v = versionformat_unpack(indexdata[:4])[0]
1057 self._initempty = False
1058 except IOError as inst:
1059 if inst.errno != errno.ENOENT:
1060 raise
1061
1062 self.version = v
1063 self._inline = v & FLAG_INLINE_DATA
1064 self._generaldelta = v & FLAG_GENERALDELTA
1065 flags = v & ~0xFFFF
1066 fmt = v & 0xFFFF
1067 if fmt == REVLOGV0:
1068 if flags:
1069 raise RevlogError(_('unknown flags (%#04x) in version %d '
1070 'revlog %s') %
1071 (flags >> 16, fmt, self.indexfile))
1072 elif fmt == REVLOGV1:
1073 if flags & ~REVLOGV1_FLAGS:
1074 raise RevlogError(_('unknown flags (%#04x) in version %d '
1075 'revlog %s') %
1076 (flags >> 16, fmt, self.indexfile))
1077 elif fmt == REVLOGV2:
1078 if flags & ~REVLOGV2_FLAGS:
1079 raise RevlogError(_('unknown flags (%#04x) in version %d '
1080 'revlog %s') %
1081 (flags >> 16, fmt, self.indexfile))
1082 else:
1083 raise RevlogError(_('unknown version (%d) in revlog %s') %
1084 (fmt, self.indexfile))
1085
1086 self._storedeltachains = True
1087
1088 self._io = revlogio()
1089 if self.version == REVLOGV0:
1090 self._io = revlogoldio()
1091 try:
1092 d = self._io.parseindex(indexdata, self._inline)
1093 except (ValueError, IndexError):
1094 raise RevlogError(_("index %s is corrupted") % (self.indexfile))
1095 self.index, nodemap, self._chunkcache = d
1096 if nodemap is not None:
1097 self.nodemap = self._nodecache = nodemap
1098 if not self._chunkcache:
1099 self._chunkclear()
1100 # revnum -> (chain-length, sum-delta-length)
1101 self._chaininfocache = {}
1102 # revlog header -> revlog compressor
1103 self._decompressors = {}
1104
1105 @util.propertycache
1106 def _compressor(self):
1107 return util.compengines[self._compengine].revlogcompressor()
1108
1109 def _indexfp(self, mode='r'):
1110 """file object for the revlog's index file"""
1111 args = {r'mode': mode}
1112 if mode != 'r':
1113 args[r'checkambig'] = self._checkambig
1114 if mode == 'w':
1115 args[r'atomictemp'] = True
1116 return self.opener(self.indexfile, **args)
1117
1118 def _datafp(self, mode='r'):
1119 """file object for the revlog's data file"""
1120 return self.opener(self.datafile, mode=mode)
1121
1122 @contextlib.contextmanager
1123 def _datareadfp(self, existingfp=None):
1124 """file object suitable to read data"""
1125 if existingfp is not None:
1126 yield existingfp
1127 else:
1128 if self._inline:
1129 func = self._indexfp
1130 else:
1131 func = self._datafp
1132 with func() as fp:
1133 yield fp
1134
1135 def tip(self):
1136 return self.node(len(self.index) - 1)
1137 def __contains__(self, rev):
1138 return 0 <= rev < len(self)
1139 def __len__(self):
1140 return len(self.index)
1141 def __iter__(self):
1142 return iter(pycompat.xrange(len(self)))
1143 def revs(self, start=0, stop=None):
1144 """iterate over all rev in this revlog (from start to stop)"""
1145 step = 1
1146 length = len(self)
1147 if stop is not None:
1148 if start > stop:
1149 step = -1
1150 stop += step
1151 if stop > length:
1152 stop = length
1153 else:
1154 stop = length
1155 return pycompat.xrange(start, stop, step)
1156
1157 @util.propertycache
1158 def nodemap(self):
1159 if self.index:
1160 # populate mapping down to the initial node
1161 node0 = self.index[0][7] # get around changelog filtering
1162 self.rev(node0)
1163 return self._nodecache
1164
1165 def hasnode(self, node):
1166 try:
1167 self.rev(node)
1168 return True
1169 except KeyError:
1170 return False
1171
1172 def candelta(self, baserev, rev):
1173 """whether two revisions (baserev, rev) can be delta-ed or not"""
1174 # Disable delta if either rev requires a content-changing flag
1175 # processor (ex. LFS). This is because such flag processor can alter
1176 # the rawtext content that the delta will be based on, and two clients
1177 # could have a same revlog node with different flags (i.e. different
1178 # rawtext contents) and the delta could be incompatible.
1179 if ((self.flags(baserev) & REVIDX_RAWTEXT_CHANGING_FLAGS)
1180 or (self.flags(rev) & REVIDX_RAWTEXT_CHANGING_FLAGS)):
1181 return False
1182 return True
1183
1184 def clearcaches(self):
1185 self._cache = None
1186 self._chainbasecache.clear()
1187 self._chunkcache = (0, '')
1188 self._pcache = {}
1189
1190 try:
1191 self._nodecache.clearcaches()
1192 except AttributeError:
1193 self._nodecache = {nullid: nullrev}
1194 self._nodepos = None
1195
1196 def rev(self, node):
1197 try:
1198 return self._nodecache[node]
1199 except TypeError:
1200 raise
1201 except RevlogError:
1202 # parsers.c radix tree lookup failed
1203 if node == wdirid or node in wdirfilenodeids:
1204 raise error.WdirUnsupported
1205 raise LookupError(node, self.indexfile, _('no node'))
1206 except KeyError:
1207 # pure python cache lookup failed
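# Fall back to a linear scan: walk the index backwards from the last
# known position, caching each node -> rev mapping as we go, until the
# requested node is found.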
1208 n = self._nodecache
1209 i = self.index
1210 p = self._nodepos
1211 if p is None:
1212 p = len(i) - 1
1213 else:
1214 assert p < len(i)
1215 for r in pycompat.xrange(p, -1, -1):
1216 v = i[r][7]
1217 n[v] = r
1218 if v == node:
1219 self._nodepos = r - 1
1220 return r
1221 if node == wdirid or node in wdirfilenodeids:
1222 raise error.WdirUnsupported
1223 raise LookupError(node, self.indexfile, _('no node'))
1224
1225 # Accessors for index entries.
1226
1227 # First tuple entry is 8 bytes. First 6 bytes are offset. Last 2 bytes
1228 # are flags.
1229 def start(self, rev):
1230 return int(self.index[rev][0] >> 16)
1231
1232 def flags(self, rev):
1233 return self.index[rev][0] & 0xFFFF
1234
1235 def length(self, rev):
1236 return self.index[rev][1]
1237
1238 def rawsize(self, rev):
1239 """return the length of the uncompressed text for a given revision"""
1240 l = self.index[rev][2]
1241 if l >= 0:
1242 return l
1243
1244 t = self.revision(rev, raw=True)
1245 return len(t)
1246
1247 def size(self, rev):
1248 """length of non-raw text (processed by a "read" flag processor)"""
1249 # fast path: if no "read" flag processor could change the content,
1250 # size is rawsize. note: ELLIPSIS is known to not change the content.
1251 flags = self.flags(rev)
1252 if flags & (REVIDX_KNOWN_FLAGS ^ REVIDX_ELLIPSIS) == 0:
1253 return self.rawsize(rev)
1254
1255 return len(self.revision(rev, raw=False))
1256
1257 def chainbase(self, rev):
1258 base = self._chainbasecache.get(rev)
1259 if base is not None:
1260 return base
1261
1262 index = self.index
1263 iterrev = rev
1264 base = index[iterrev][3]
1265 while base != iterrev:
1266 iterrev = base
1267 base = index[iterrev][3]
1268
1269 self._chainbasecache[rev] = base
1270 return base
1271
1272 def linkrev(self, rev):
1273 return self.index[rev][4]
1274
1275 def parentrevs(self, rev):
1276 try:
1277 entry = self.index[rev]
1278 except IndexError:
1279 if rev == wdirrev:
1280 raise error.WdirUnsupported
1281 raise
1282
1283 return entry[5], entry[6]
1284
1285 def node(self, rev):
1286 try:
1287 return self.index[rev][7]
1288 except IndexError:
1289 if rev == wdirrev:
1290 raise error.WdirUnsupported
1291 raise
1292
1293 # Derived from index values.
1294
1295 def end(self, rev):
1296 return self.start(rev) + self.length(rev)
1297
1298 def parents(self, node):
1299 i = self.index
1300 d = i[self.rev(node)]
1301 return i[d[5]][7], i[d[6]][7] # map revisions to nodes inline
1302
1303 def chainlen(self, rev):
1304 return self._chaininfo(rev)[0]
1305
1306 def _chaininfo(self, rev):
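# Compute (chain length, total compressed delta size) for ``rev`` by
# walking its delta chain, reusing cached results from revisions further
# down the chain when available.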
1307 chaininfocache = self._chaininfocache
1308 if rev in chaininfocache:
1309 return chaininfocache[rev]
1310 index = self.index
1311 generaldelta = self._generaldelta
1312 iterrev = rev
1313 e = index[iterrev]
1314 clen = 0
1315 compresseddeltalen = 0
1316 while iterrev != e[3]:
1317 clen += 1
1318 compresseddeltalen += e[1]
1319 if generaldelta:
1320 iterrev = e[3]
1321 else:
1322 iterrev -= 1
1323 if iterrev in chaininfocache:
1324 t = chaininfocache[iterrev]
1325 clen += t[0]
1326 compresseddeltalen += t[1]
1327 break
1328 e = index[iterrev]
1329 else:
1330 # Add text length of base since decompressing that also takes
1331 # work. For cache hits the length is already included.
1332 compresseddeltalen += e[1]
1333 r = (clen, compresseddeltalen)
1334 chaininfocache[rev] = r
1335 return r
1336
1337 def _deltachain(self, rev, stoprev=None):
1338 """Obtain the delta chain for a revision.
1339
1340 ``stoprev`` specifies a revision to stop at. If not specified, we
1341 stop at the base of the chain.
1342
1343 Returns a 2-tuple of (chain, stopped) where ``chain`` is a list of
1344 revs in ascending order and ``stopped`` is a bool indicating whether
1345 ``stoprev`` was hit.
1346 """
1347 # Try C implementation.
1348 try:
1349 return self.index.deltachain(rev, stoprev, self._generaldelta)
1350 except AttributeError:
1351 pass
1352
1353 chain = []
1354
1355 # Alias to prevent attribute lookup in tight loop.
1356 index = self.index
1357 generaldelta = self._generaldelta
1358
1359 iterrev = rev
1360 e = index[iterrev]
1361 while iterrev != e[3] and iterrev != stoprev:
1362 chain.append(iterrev)
1363 if generaldelta:
1364 iterrev = e[3]
1365 else:
1366 iterrev -= 1
1367 e = index[iterrev]
1368
1369 if iterrev == stoprev:
1370 stopped = True
1371 else:
1372 chain.append(iterrev)
1373 stopped = False
1374
1375 chain.reverse()
1376 return chain, stopped
1377
1378 def ancestors(self, revs, stoprev=0, inclusive=False):
1379 """Generate the ancestors of 'revs' in reverse topological order.
1380 Does not generate revs lower than stoprev.
1381
1382 See the documentation for ancestor.lazyancestors for more details."""
1383
1384 return ancestor.lazyancestors(self.parentrevs, revs, stoprev=stoprev,
1385 inclusive=inclusive)
1386
1387 def descendants(self, revs):
1388 """Generate the descendants of 'revs' in revision order.
1389
1390 Yield a sequence of revision numbers starting with a child of
1391 some rev in revs, i.e., each revision is *not* considered a
1392 descendant of itself. Results are ordered by revision number (a
1393 topological sort)."""
1394 first = min(revs)
1395 if first == nullrev:
1396 for i in self:
1397 yield i
1398 return
1399
1400 seen = set(revs)
1401 for i in self.revs(start=first + 1):
1402 for x in self.parentrevs(i):
1403 if x != nullrev and x in seen:
1404 seen.add(i)
1405 yield i
1406 break
1407
1408 def findcommonmissing(self, common=None, heads=None):
1409 """Return a tuple of the ancestors of common and the ancestors of heads
1410 that are not ancestors of common. In revset terminology, we return the
1411 tuple:
1412
1413 ::common, (::heads) - (::common)
1414
1415 The list is sorted by revision number, meaning it is
1416 topologically sorted.
1417
1418 'heads' and 'common' are both lists of node IDs. If heads is
1419 not supplied, uses all of the revlog's heads. If common is not
1420 supplied, uses nullid."""
1421 if common is None:
1422 common = [nullid]
1423 if heads is None:
1424 heads = self.heads()
1425
1426 common = [self.rev(n) for n in common]
1427 heads = [self.rev(n) for n in heads]
1428
1429 # we want the ancestors, but inclusive
1430 class lazyset(object):
1431 def __init__(self, lazyvalues):
1432 self.addedvalues = set()
1433 self.lazyvalues = lazyvalues
1434
1435 def __contains__(self, value):
1436 return value in self.addedvalues or value in self.lazyvalues
1437
1438 def __iter__(self):
1439 added = self.addedvalues
1440 for r in added:
1441 yield r
1442 for r in self.lazyvalues:
1443 if r not in added:
1444 yield r
1445
1446 def add(self, value):
1447 self.addedvalues.add(value)
1448
1449 def update(self, values):
1450 self.addedvalues.update(values)
1451
1452 has = lazyset(self.ancestors(common))
1453 has.add(nullrev)
1454 has.update(common)
1455
1456 # take all ancestors from heads that aren't in has
1457 missing = set()
1458 visit = collections.deque(r for r in heads if r not in has)
1459 while visit:
1460 r = visit.popleft()
1461 if r in missing:
1462 continue
1463 else:
1464 missing.add(r)
1465 for p in self.parentrevs(r):
1466 if p not in has:
1467 visit.append(p)
1468 missing = list(missing)
1469 missing.sort()
1470 return has, [self.node(miss) for miss in missing]
1471
1472 def incrementalmissingrevs(self, common=None):
1473 """Return an object that can be used to incrementally compute the
1474 revision numbers of the ancestors of arbitrary sets that are not
1475 ancestors of common. This is an ancestor.incrementalmissingancestors
1476 object.
1477
1478 'common' is a list of revision numbers. If common is not supplied, uses
1479 nullrev.
1480 """
1481 if common is None:
1482 common = [nullrev]
1483
1484 return ancestor.incrementalmissingancestors(self.parentrevs, common)
1485
1486 def findmissingrevs(self, common=None, heads=None):
1487 """Return the revision numbers of the ancestors of heads that
1488 are not ancestors of common.
1489
1490 More specifically, return a list of revision numbers corresponding to
1491 nodes N such that every N satisfies the following constraints:
1492
1493 1. N is an ancestor of some node in 'heads'
1494 2. N is not an ancestor of any node in 'common'
1495
1496 The list is sorted by revision number, meaning it is
1497 topologically sorted.
1498
1499 'heads' and 'common' are both lists of revision numbers. If heads is
1500 not supplied, uses all of the revlog's heads. If common is not
1501 supplied, uses nullrev."""
1502 if common is None:
1503 common = [nullrev]
1504 if heads is None:
1505 heads = self.headrevs()
1506
1507 inc = self.incrementalmissingrevs(common=common)
1508 return inc.missingancestors(heads)
1509
1510 def findmissing(self, common=None, heads=None):
1511 """Return the ancestors of heads that are not ancestors of common.
1512
1513 More specifically, return a list of nodes N such that every N
1514 satisfies the following constraints:
1515
1516 1. N is an ancestor of some node in 'heads'
1517 2. N is not an ancestor of any node in 'common'
1518
1519 The list is sorted by revision number, meaning it is
1520 topologically sorted.
1521
1522 'heads' and 'common' are both lists of node IDs. If heads is
1523 not supplied, uses all of the revlog's heads. If common is not
1524 supplied, uses nullid."""
1525 if common is None:
1526 common = [nullid]
1527 if heads is None:
1528 heads = self.heads()
1529
1530 common = [self.rev(n) for n in common]
1531 heads = [self.rev(n) for n in heads]
1532
1533 inc = self.incrementalmissingrevs(common=common)
1534 return [self.node(r) for r in inc.missingancestors(heads)]
1535
1536 def nodesbetween(self, roots=None, heads=None):
1537 """Return a topological path from 'roots' to 'heads'.
1538
1539 Return a tuple (nodes, outroots, outheads) where 'nodes' is a
1540 topologically sorted list of all nodes N that satisfy both of
1541 these constraints:
1542
1543 1. N is a descendant of some node in 'roots'
1544 2. N is an ancestor of some node in 'heads'
1545
1546 Every node is considered to be both a descendant and an ancestor
1547 of itself, so every reachable node in 'roots' and 'heads' will be
1548 included in 'nodes'.
1549
1550 'outroots' is the list of reachable nodes in 'roots', i.e., the
1551 subset of 'roots' that is returned in 'nodes'. Likewise,
1552 'outheads' is the subset of 'heads' that is also in 'nodes'.
1553
1554 'roots' and 'heads' are both lists of node IDs. If 'roots' is
1555 unspecified, uses nullid as the only root. If 'heads' is
1556 unspecified, uses list of all of the revlog's heads."""
1557 nonodes = ([], [], [])
1558 if roots is not None:
1559 roots = list(roots)
1560 if not roots:
1561 return nonodes
1562 lowestrev = min([self.rev(n) for n in roots])
1563 else:
1564 roots = [nullid] # Everybody's a descendant of nullid
1565 lowestrev = nullrev
1566 if (lowestrev == nullrev) and (heads is None):
1567 # We want _all_ the nodes!
1568 return ([self.node(r) for r in self], [nullid], list(self.heads()))
1569 if heads is None:
1570 # All nodes are ancestors, so the latest ancestor is the last
1571 # node.
1572 highestrev = len(self) - 1
1573 # Set ancestors to None to signal that every node is an ancestor.
1574 ancestors = None
1575 # Set heads to an empty dictionary for later discovery of heads
1576 heads = {}
1577 else:
1578 heads = list(heads)
1579 if not heads:
1580 return nonodes
1581 ancestors = set()
1582 # Turn heads into a dictionary so we can remove 'fake' heads.
1583 # Also, later we will be using it to filter out the heads we can't
1584 # find from roots.
1585 heads = dict.fromkeys(heads, False)
1586 # Start at the top and keep marking parents until we're done.
1587 nodestotag = set(heads)
1588 # Remember where the top was so we can use it as a limit later.
1589 highestrev = max([self.rev(n) for n in nodestotag])
1590 while nodestotag:
1591 # grab a node to tag
1592 n = nodestotag.pop()
1593 # Never tag nullid
1594 if n == nullid:
1595 continue
1596 # A node's revision number represents its place in a
1597 # topologically sorted list of nodes.
1598 r = self.rev(n)
1599 if r >= lowestrev:
1600 if n not in ancestors:
1601 # If we are possibly a descendant of one of the roots
1602 # and we haven't already been marked as an ancestor
1603 ancestors.add(n) # Mark as ancestor
1604 # Add non-nullid parents to list of nodes to tag.
1605 nodestotag.update([p for p in self.parents(n) if
1606 p != nullid])
1607 elif n in heads: # We've seen it before, is it a fake head?
1608 # So it is, real heads should not be the ancestors of
1609 # any other heads.
1610 heads.pop(n)
1611 if not ancestors:
1612 return nonodes
1613 # Now that we have our set of ancestors, we want to remove any
1614 # roots that are not ancestors.
1615
1616 # If one of the roots was nullid, everything is included anyway.
1617 if lowestrev > nullrev:
1618 # But, since we weren't, let's recompute the lowest rev to not
1619 # include roots that aren't ancestors.
1620
1621 # Filter out roots that aren't ancestors of heads
1622 roots = [root for root in roots if root in ancestors]
1623 # Recompute the lowest revision
1624 if roots:
1625 lowestrev = min([self.rev(root) for root in roots])
1626 else:
1627 # No more roots? Return empty list
1628 return nonodes
1629 else:
1630 # We are descending from nullid, and don't need to care about
1631 # any other roots.
1632 lowestrev = nullrev
1633 roots = [nullid]
1634 # Transform our roots list into a set.
1635 descendants = set(roots)
1636 # Also, keep the original roots so we can filter out roots that aren't
1637 # 'real' roots (i.e. are descended from other roots).
1638 roots = descendants.copy()
1639 # Our topologically sorted list of output nodes.
1640 orderedout = []
1641 # Don't start at nullid since we don't want nullid in our output list,
1642 # and if nullid shows up in descendants, empty parents will look like
1643 # they're descendants.
1644 for r in self.revs(start=max(lowestrev, 0), stop=highestrev + 1):
1645 n = self.node(r)
1646 isdescendant = False
1647 if lowestrev == nullrev: # Everybody is a descendant of nullid
1648 isdescendant = True
1649 elif n in descendants:
1650 # n is already a descendant
1651 isdescendant = True
1652 # This check only needs to be done here because all the roots
1653 # will start being marked as descendants before the loop.
1654 if n in roots:
1655 # If n was a root, check if it's a 'real' root.
1656 p = tuple(self.parents(n))
1657 # If any of its parents are descendants, it's not a root.
1658 if (p[0] in descendants) or (p[1] in descendants):
1659 roots.remove(n)
1660 else:
1661 p = tuple(self.parents(n))
1662 # A node is a descendant if either of its parents is a
1663 # descendant. (We seeded the descendants set with the roots
1664 # up there, remember?)
1665 if (p[0] in descendants) or (p[1] in descendants):
1666 descendants.add(n)
1667 isdescendant = True
1668 if isdescendant and ((ancestors is None) or (n in ancestors)):
1669 # Only include nodes that are both descendants and ancestors.
1670 orderedout.append(n)
1671 if (ancestors is not None) and (n in heads):
1672 # We're trying to figure out which heads are reachable
1673 # from roots.
1674 # Mark this head as having been reached
1675 heads[n] = True
1676 elif ancestors is None:
1677 # Otherwise, we're trying to discover the heads.
1678 # Assume this is a head because if it isn't, the next step
1679 # will eventually remove it.
1680 heads[n] = True
1681 # But, obviously its parents aren't.
1682 for p in self.parents(n):
1683 heads.pop(p, None)
1684 heads = [head for head, flag in heads.iteritems() if flag]
1685 roots = list(roots)
1686 assert orderedout
1687 assert roots
1688 assert heads
1689 return (orderedout, roots, heads)
1690
1691 def headrevs(self):
1692 try:
1693 return self.index.headrevs()
1694 except AttributeError:
1695 return self._headrevs()
1696
1697 def computephases(self, roots):
1698 return self.index.computephasesmapsets(roots)
1699
1700 def _headrevs(self):
1701 count = len(self)
1702 if not count:
1703 return [nullrev]
1704 # we won't iterate over filtered revs, so nobody is a head at the start
1705 ishead = [0] * (count + 1)
1706 index = self.index
1707 for r in self:
1708 ishead[r] = 1 # I may be a head
1709 e = index[r]
1710 ishead[e[5]] = ishead[e[6]] = 0 # my parents are not
1711 return [r for r, val in enumerate(ishead) if val]
1712
1713 def heads(self, start=None, stop=None):
1714 """return the list of all nodes that have no children
1715
1716 if start is specified, only heads that are descendants of
1717 start will be returned
1718 if stop is specified, it will consider all the revs from stop
1719 as if they had no children
1720 """
1721 if start is None and stop is None:
1722 if not len(self):
1723 return [nullid]
1724 return [self.node(r) for r in self.headrevs()]
1725
1726 if start is None:
1727 start = nullid
1728 if stop is None:
1729 stop = []
1730 stoprevs = set([self.rev(n) for n in stop])
1731 startrev = self.rev(start)
1732 reachable = {startrev}
1733 heads = {startrev}
1734
1735 parentrevs = self.parentrevs
1736 for r in self.revs(start=startrev + 1):
1737 for p in parentrevs(r):
1738 if p in reachable:
1739 if r not in stoprevs:
1740 reachable.add(r)
1741 heads.add(r)
1742 if p in heads and p not in stoprevs:
1743 heads.remove(p)
1744
1745 return [self.node(r) for r in heads]
1746
1747 def children(self, node):
1748 """find the children of a given node"""
1749 c = []
1750 p = self.rev(node)
1751 for r in self.revs(start=p + 1):
1752 prevs = [pr for pr in self.parentrevs(r) if pr != nullrev]
1753 if prevs:
1754 for pr in prevs:
1755 if pr == p:
1756 c.append(self.node(r))
1757 elif p == nullrev:
1758 c.append(self.node(r))
1759 return c
1760
1761 def commonancestorsheads(self, a, b):
1762 """calculate all the heads of the common ancestors of nodes a and b"""
1763 a, b = self.rev(a), self.rev(b)
1764 ancs = self._commonancestorsheads(a, b)
1765 return pycompat.maplist(self.node, ancs)
1766
1767 def _commonancestorsheads(self, *revs):
1768 """calculate all the heads of the common ancestors of revs"""
1769 try:
1770 ancs = self.index.commonancestorsheads(*revs)
1771 except (AttributeError, OverflowError): # C implementation failed
1772 ancs = ancestor.commonancestorsheads(self.parentrevs, *revs)
1773 return ancs
1774
1775 def isancestor(self, a, b):
1776 """return True if node a is an ancestor of node b
1777
1778 A revision is considered an ancestor of itself."""
1779 a, b = self.rev(a), self.rev(b)
1780 return self.isancestorrev(a, b)
1781
1782 def isancestorrev(self, a, b):
1783 """return True if revision a is an ancestor of revision b
1784
1785 A revision is considered an ancestor of itself.
1786
1787 The implementation of this is trivial but the use of
1788 commonancestorsheads is not."""
1789 if a == nullrev:
1790 return True
1791 elif a == b:
1792 return True
1793 elif a > b:
1794 return False
1795 return a in self._commonancestorsheads(a, b)
1796
1797 def ancestor(self, a, b):
1798 """calculate the "best" common ancestor of nodes a and b"""
1799
1800 a, b = self.rev(a), self.rev(b)
1801 try:
1802 ancs = self.index.ancestors(a, b)
1803 except (AttributeError, OverflowError):
1804 ancs = ancestor.ancestors(self.parentrevs, a, b)
1805 if ancs:
1806 # choose a consistent winner when there's a tie
1807 return min(map(self.node, ancs))
1808 return nullid
1809
1810 def _match(self, id):
1811 if isinstance(id, int):
1812 # rev
1813 return self.node(id)
1814 if len(id) == 20:
1815 # possibly a binary node
1816 # odds of a binary node being all hex in ASCII are 1 in 10**25
1817 try:
1818 node = id
1819 self.rev(node) # quick search the index
1820 return node
1821 except LookupError:
1822 pass # may be partial hex id
1823 try:
1824 # str(rev)
1825 rev = int(id)
1826 if "%d" % rev != id:
1827 raise ValueError
1828 if rev < 0:
1829 rev = len(self) + rev
1830 if rev < 0 or rev >= len(self):
1831 raise ValueError
1832 return self.node(rev)
1833 except (ValueError, OverflowError):
1834 pass
1835 if len(id) == 40:
1836 try:
1837 # a full hex nodeid?
1838 node = bin(id)
1839 self.rev(node)
1840 return node
1841 except (TypeError, LookupError):
1842 pass
1843
1844 def _partialmatch(self, id):
1845 # we don't care about wdirfilenodeids as they should always be full hashes
1846 maybewdir = wdirhex.startswith(id)
1847 try:
1848 partial = self.index.partialmatch(id)
1849 if partial and self.hasnode(partial):
1850 if maybewdir:
1851 # single 'ff...' match in radix tree, ambiguous with wdir
1852 raise RevlogError
1853 return partial
1854 if maybewdir:
1855 # no 'ff...' match in radix tree, wdir identified
1856 raise error.WdirUnsupported
1857 return None
1858 except RevlogError:
1859 # parsers.c radix tree lookup gave multiple matches
1860 # fast path: for unfiltered changelog, radix tree is accurate
1861 if not getattr(self, 'filteredrevs', None):
1862 raise AmbiguousPrefixLookupError(id, self.indexfile,
1863 _('ambiguous identifier'))
1864 # fall through to slow path that filters hidden revisions
1865 except (AttributeError, ValueError):
1866 # we are pure python, or key was too short to search radix tree
1867 pass
1868
1869 if id in self._pcache:
1870 return self._pcache[id]
1871
1872 if len(id) <= 40:
1873 try:
1874 # hex(node)[:...]
1875 l = len(id) // 2 # grab an even number of digits
1876 prefix = bin(id[:l * 2])
1877 nl = [e[7] for e in self.index if e[7].startswith(prefix)]
1878 nl = [n for n in nl if hex(n).startswith(id) and
1879 self.hasnode(n)]
1880 if nullhex.startswith(id):
1881 nl.append(nullid)
1882 if len(nl) > 0:
1883 if len(nl) == 1 and not maybewdir:
1884 self._pcache[id] = nl[0]
1885 return nl[0]
1886 raise AmbiguousPrefixLookupError(id, self.indexfile,
1887 _('ambiguous identifier'))
1888 if maybewdir:
1889 raise error.WdirUnsupported
1890 return None
1891 except TypeError:
1892 pass
1893
1894 def lookup(self, id):
1895 """locate a node based on:
1896 - revision number or str(revision number)
1897 - nodeid or subset of hex nodeid
1898 """
1899 n = self._match(id)
1900 if n is not None:
1901 return n
1902 n = self._partialmatch(id)
1903 if n:
1904 return n
1905
1906 raise LookupError(id, self.indexfile, _('no match found'))
1907
1908 def shortest(self, node, minlength=1):
1909 """Find the shortest unambiguous prefix that matches node."""
1910 def isvalid(prefix):
1911 try:
1912 node = self._partialmatch(prefix)
1913 except error.RevlogError:
1914 return False
1915 except error.WdirUnsupported:
1916 # single 'ff...' match
1917 return True
1918 if node is None:
1919 raise LookupError(node, self.indexfile, _('no node'))
1920 return True
1921
1922 def maybewdir(prefix):
1923 return all(c == 'f' for c in prefix)
1924
1925 hexnode = hex(node)
1926
1927 def disambiguate(hexnode, minlength):
1928 """Disambiguate against wdirid."""
1929 for length in range(minlength, 41):
1930 prefix = hexnode[:length]
1931 if not maybewdir(prefix):
1932 return prefix
1933
1934 if not getattr(self, 'filteredrevs', None):
1935 try:
1936 length = max(self.index.shortest(node), minlength)
1937 return disambiguate(hexnode, length)
1938 except RevlogError:
1939 if node != wdirid:
1940 raise LookupError(node, self.indexfile, _('no node'))
1941 except AttributeError:
1942 # Fall through to pure code
1943 pass
1944
1945 if node == wdirid:
1946 for length in range(minlength, 41):
1947 prefix = hexnode[:length]
1948 if isvalid(prefix):
1949 return prefix
1950
1951 for length in range(minlength, 41):
1952 prefix = hexnode[:length]
1953 if isvalid(prefix):
1954 return disambiguate(hexnode, length)
1955
1956 def cmp(self, node, text):
1957 """compare text with a given file revision
1958
1959 returns True if text is different than what is stored.
1960 """
1961 p1, p2 = self.parents(node)
1962 return hash(text, p1, p2) != node
1963
1964 def _cachesegment(self, offset, data):
1965 """Add a segment to the revlog cache.
1966
1967 Accepts an absolute offset and the data that is at that location.
1968 """
1969 o, d = self._chunkcache
1970 # try to add to existing cache
1971 if o + len(d) == offset and len(d) + len(data) < _chunksize:
1972 self._chunkcache = o, d + data
1973 else:
1974 self._chunkcache = offset, data
1975
1976 def _readsegment(self, offset, length, df=None):
1977 """Load a segment of raw data from the revlog.
1978
1979 Accepts an absolute offset, length to read, and an optional existing
1980 file handle to read from.
1981
1982 If an existing file handle is passed, it will be seeked and the
1983 original seek position will NOT be restored.
1984
1985 Returns a str or buffer of raw byte data.
1986 """
1987 # Cache data both forward and backward around the requested
1988 # data, in a fixed size window. This helps speed up operations
1989 # involving reading the revlog backwards.
1990 cachesize = self._chunkcachesize
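# Align the read window to cache-size boundaries: rounding the start
# down and the end up relies on _chunkcachesize being a power of two
# (enforced in __init__), so "& ~(cachesize - 1)" clears the low bits.
# For example, with a 64 KiB cache an offset of 70000 rounds down to 65536.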
1991 realoffset = offset & ~(cachesize - 1)
1992 reallength = (((offset + length + cachesize) & ~(cachesize - 1))
1993 - realoffset)
1994 with self._datareadfp(df) as df:
1995 df.seek(realoffset)
1996 d = df.read(reallength)
1997 self._cachesegment(realoffset, d)
1998 if offset != realoffset or reallength != length:
1999 return util.buffer(d, offset - realoffset, length)
2000 return d
2001
2002 def _getsegment(self, offset, length, df=None):
2003 """Obtain a segment of raw data from the revlog.
2004
2005 Accepts an absolute offset, length of bytes to obtain, and an
2006 optional file handle to the already-opened revlog. If the file
2007 handle is used, its original seek position will not be preserved.
2008
2009 Requests for data may be returned from a cache.
2010
2011 Returns a str or a buffer instance of raw byte data.
2012 """
2013 o, d = self._chunkcache
2014 l = len(d)
2015
2016 # is it in the cache?
2017 cachestart = offset - o
2018 cacheend = cachestart + length
2019 if cachestart >= 0 and cacheend <= l:
2020 if cachestart == 0 and cacheend == l:
2021 return d # avoid a copy
2022 return util.buffer(d, cachestart, cacheend - cachestart)
2023
2024 return self._readsegment(offset, length, df=df)
2025
2026 def _getsegmentforrevs(self, startrev, endrev, df=None):
2027 """Obtain a segment of raw data corresponding to a range of revisions.
2028
2029 Accepts the start and end revisions and an optional already-open
2030 file handle to be used for reading. If the file handle is read, its
2031 seek position will not be preserved.
2032
2033 Requests for data may be satisfied by a cache.
2034
2035 Returns a 2-tuple of (offset, data) for the requested range of
2036 revisions. Offset is the integer offset from the beginning of the
2037 revlog and data is a str or buffer of the raw byte data.
2038
2039 Callers will need to call ``self.start(rev)`` and ``self.length(rev)``
2040 to determine where each revision's data begins and ends.
2041 """
2042 # Inlined self.start(startrev) & self.end(endrev) for perf reasons
2043 # (functions are expensive).
2044 index = self.index
2045 istart = index[startrev]
2046 start = int(istart[0] >> 16)
2047 if startrev == endrev:
2048 end = start + istart[1]
2049 else:
2050 iend = index[endrev]
2051 end = int(iend[0] >> 16) + iend[1]
2052
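# For inline revlogs, index entries and data chunks are interleaved in
# a single file, so shift the offsets past the index entries that
# precede the requested data.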
2053 if self._inline:
2054 start += (startrev + 1) * self._io.size
2055 end += (endrev + 1) * self._io.size
2056 length = end - start
2057
2058 return start, self._getsegment(start, length, df=df)
2059
2060 def _chunk(self, rev, df=None):
2061 """Obtain a single decompressed chunk for a revision.
2062
2063 Accepts an integer revision and an optional already-open file handle
2064 to be used for reading. If used, the seek position of the file will not
2065 be preserved.
2066
2067 Returns a str holding uncompressed data for the requested revision.
2068 """
2069 return self.decompress(self._getsegmentforrevs(rev, rev, df=df)[1])
2070
2071 def _chunks(self, revs, df=None, targetsize=None):
2072 """Obtain decompressed chunks for the specified revisions.
2073
2074 Accepts an iterable of numeric revisions that are assumed to be in
2075 ascending order. Also accepts an optional already-open file handle
2076 to be used for reading. If used, the seek position of the file will
2077 not be preserved.
2078
2079 This function is similar to calling ``self._chunk()`` multiple times,
2080 but is faster.
2081
2082 Returns a list with decompressed data for each requested revision.
2083 """
2084 if not revs:
2085 return []
2086 start = self.start
2087 length = self.length
2088 inline = self._inline
2089 iosize = self._io.size
2090 buffer = util.buffer
2091
2092 l = []
2093 ladd = l.append
2094
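# With sparse reads enabled, split the revision run into slices that are
# dense enough to read in one go; otherwise read the whole run at once.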
2095 if not self._withsparseread:
2096 slicedchunks = (revs,)
2097 else:
2098 slicedchunks = _slicechunk(self, revs, targetsize=targetsize)
2099
2100 for revschunk in slicedchunks:
2101 firstrev = revschunk[0]
2102 # Skip trailing revisions with empty diff
2103 for lastrev in revschunk[::-1]:
2104 if length(lastrev) != 0:
2105 break
2106
2107 try:
2108 offset, data = self._getsegmentforrevs(firstrev, lastrev, df=df)
2109 except OverflowError:
2110 # issue4215 - we can't cache a run of chunks greater than
2111 # 2G on Windows
2112 return [self._chunk(rev, df=df) for rev in revschunk]
2113
2114 decomp = self.decompress
2115 for rev in revschunk:
2116 chunkstart = start(rev)
2117 if inline:
2118 chunkstart += (rev + 1) * iosize
2119 chunklength = length(rev)
2120 ladd(decomp(buffer(data, chunkstart - offset, chunklength)))
2121
2122 return l
2123
2124 def _chunkclear(self):
2125 """Clear the raw chunk cache."""
2126 self._chunkcache = (0, '')
2127
2128 def deltaparent(self, rev):
2129 """return deltaparent of the given revision"""
2130 base = self.index[rev][3]
2131 if base == rev:
2132 return nullrev
2133 elif self._generaldelta:
2134 return base
2135 else:
2136 return rev - 1
2137
2138 def issnapshot(self, rev):
2139 """tells whether rev is a snapshot
2140 """
2141 if rev == nullrev:
2142 return True
2143 deltap = self.deltaparent(rev)
2144 if deltap == nullrev:
2145 return True
2146 p1, p2 = self.parentrevs(rev)
2147 if deltap in (p1, p2):
2148 return False
2149 return self.issnapshot(deltap)
2150
2151 def snapshotdepth(self, rev):
2152 """number of snapshot in the chain before this one"""
2153 if not self.issnapshot(rev):
2154 raise ProgrammingError('revision %d not a snapshot' % rev)
2155 return len(self._deltachain(rev)[0]) - 1
2156
2157 def revdiff(self, rev1, rev2):
2158 """return or calculate a delta between two revisions
2159
2160 The delta calculated is in binary form and is intended to be written to
2161 revlog data directly. So this function needs raw revision data.
2162 """
2163 if rev1 != nullrev and self.deltaparent(rev2) == rev1:
2164 return bytes(self._chunk(rev2))
2165
2166 return mdiff.textdiff(self.revision(rev1, raw=True),
2167 self.revision(rev2, raw=True))
2168
2169 def revision(self, nodeorrev, _df=None, raw=False):
2170 """return an uncompressed revision of a given node or revision
2171 number.
2172
2173 _df - an existing file handle to read from. (internal-only)
2174 raw - an optional argument specifying if the revision data is to be
2175 treated as raw data when applying flag transforms. 'raw' should be set
2176 to True when generating changegroups or in debug commands.
2177 """
2178 if isinstance(nodeorrev, int):
2179 rev = nodeorrev
2180 node = self.node(rev)
2181 else:
2182 node = nodeorrev
2183 rev = None
2184
2185 cachedrev = None
2186 flags = None
2187 rawtext = None
2188 if node == nullid:
2189 return ""
2190 if self._cache:
2191 if self._cache[0] == node:
2192 # _cache only stores rawtext
2193 if raw:
2194 return self._cache[2]
2195 # duplicated, but good for perf
2196 if rev is None:
2197 rev = self.rev(node)
2198 if flags is None:
2199 flags = self.flags(rev)
2200 # no extra flags set, no flag processor runs, text = rawtext
2201 if flags == REVIDX_DEFAULT_FLAGS:
2202 return self._cache[2]
2203 # rawtext is reusable. need to run flag processor
2204 rawtext = self._cache[2]
2205
2206 cachedrev = self._cache[1]
2207
2208 # look up what we need to read
2209 if rawtext is None:
2210 if rev is None:
2211 rev = self.rev(node)
2212
2213 chain, stopped = self._deltachain(rev, stoprev=cachedrev)
2214 if stopped:
2215 rawtext = self._cache[2]
2216
2217 # drop cache to save memory
2218 self._cache = None
2219
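# Limit the span of each sliced read to roughly four times the expected
# raw text size of the revision being reconstructed.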
2220 targetsize = None
2221 rawsize = self.index[rev][2]
2222 if 0 <= rawsize:
2223 targetsize = 4 * rawsize
2224
2225 bins = self._chunks(chain, df=_df, targetsize=targetsize)
2226 if rawtext is None:
2227 rawtext = bytes(bins[0])
2228 bins = bins[1:]
2229
2230 rawtext = mdiff.patches(rawtext, bins)
2231 self._cache = (node, rev, rawtext)
2232
2233 if flags is None:
2234 if rev is None:
2235 rev = self.rev(node)
2236 flags = self.flags(rev)
2237
2238 text, validatehash = self._processflags(rawtext, flags, 'read', raw=raw)
2239 if validatehash:
2240 self.checkhash(text, node, rev=rev)
2241
2242 return text
2243
2244 def hash(self, text, p1, p2):
2245 """Compute a node hash.
2246
2247 Available as a function so that subclasses can replace the hash
2248 as needed.
2249 """
2250 return hash(text, p1, p2)
2251
2252 def _processflags(self, text, flags, operation, raw=False):
2253 """Inspect revision data flags and applies transforms defined by
2254 registered flag processors.
2255
2256 ``text`` - the revision data to process
2257 ``flags`` - the revision flags
2258 ``operation`` - the operation being performed (read or write)
2259 ``raw`` - an optional argument describing if the raw transform should be
2260 applied.
2261
2262 This method processes the flags in the order (or reverse order if
2263 ``operation`` is 'write') defined by REVIDX_FLAGS_ORDER, applying the
2264 flag processors registered for present flags. The order of flags defined
2265 in REVIDX_FLAGS_ORDER needs to be stable to allow non-commutativity.
2266
2267 Returns a 2-tuple of ``(text, validatehash)`` where ``text`` is the
2268 processed text and ``validatehash`` is a bool indicating whether the
2269 returned text should be checked for hash integrity.
2270
2271 Note: If the ``raw`` argument is set, it has precedence over the
2272 operation and will only update the value of ``validatehash``.
2273 """
2274 # fast path: no flag processors will run
2275 if flags == 0:
2276 return text, True
2277 if operation not in ('read', 'write'):
2278 raise ProgrammingError(_("invalid '%s' operation ") % (operation))
2279 # Check all flags are known.
2280 if flags & ~REVIDX_KNOWN_FLAGS:
2281 raise RevlogError(_("incompatible revision flag '%#x'") %
2282 (flags & ~REVIDX_KNOWN_FLAGS))
2283 validatehash = True
2284 # Depending on the operation (read or write), the order might be
2285 # reversed due to non-commutative transforms.
2286 orderedflags = REVIDX_FLAGS_ORDER
2287 if operation == 'write':
2288 orderedflags = reversed(orderedflags)
2289
2290 for flag in orderedflags:
2291 # If a flagprocessor has been registered for a known flag, apply the
2292 # related operation transform and update result tuple.
2293 if flag & flags:
2294 vhash = True
2295
2296 if flag not in _flagprocessors:
2297 message = _("missing processor for flag '%#x'") % (flag)
2298 raise RevlogError(message)
2299
2300 processor = _flagprocessors[flag]
2301 if processor is not None:
2302 readtransform, writetransform, rawtransform = processor
2303
2304 if raw:
2305 vhash = rawtransform(self, text)
2306 elif operation == 'read':
2307 text, vhash = readtransform(self, text)
2308 else: # write operation
2309 text, vhash = writetransform(self, text)
2310 validatehash = validatehash and vhash
2311
2312 return text, validatehash
2313
2314 def checkhash(self, text, node, p1=None, p2=None, rev=None):
2315 """Check node hash integrity.
2316
2317 Available as a function so that subclasses can extend hash mismatch
2318 behaviors as needed.
2319 """
2320 try:
2321 if p1 is None and p2 is None:
2322 p1, p2 = self.parents(node)
2323 if node != self.hash(text, p1, p2):
2324 revornode = rev
2325 if revornode is None:
2326 revornode = templatefilters.short(hex(node))
2327 raise RevlogError(_("integrity check failed on %s:%s")
2328 % (self.indexfile, pycompat.bytestr(revornode)))
2329 except RevlogError:
2330 if self._censorable and _censoredtext(text):
2331 raise error.CensoredNodeError(self.indexfile, node, text)
2332 raise
2333
2334 def _enforceinlinesize(self, tr, fp=None):
2335 """Check if the revlog is too big for inline and convert if so.
2336
2337 This should be called after revisions are added to the revlog. If the
2338 revlog has grown too large to be an inline revlog, it will convert it
2339 to use multiple index and data files.
2340 """
2341 tiprev = len(self) - 1
2342 if (not self._inline or
2343 (self.start(tiprev) + self.length(tiprev)) < _maxinline):
2344 return
2345
2346 trinfo = tr.find(self.indexfile)
2347 if trinfo is None:
2348 raise RevlogError(_("%s not found in the transaction")
2349 % self.indexfile)
2350
2351 trindex = trinfo[2]
2352 if trindex is not None:
2353 dataoff = self.start(trindex)
2354 else:
2355 # revlog was stripped at start of transaction, use all leftover data
2356 trindex = len(self) - 1
2357 dataoff = self.end(tiprev)
2358
2359 tr.add(self.datafile, dataoff)
2360
2361 if fp:
2362 fp.flush()
2363 fp.close()
2364
2365 with self._datafp('w') as df:
2366 for r in self:
2367 df.write(self._getsegmentforrevs(r, r)[1])
2368
2369 with self._indexfp('w') as fp:
2370 self.version &= ~FLAG_INLINE_DATA
2371 self._inline = False
2372 io = self._io
2373 for i in self:
2374 e = io.packentry(self.index[i], self.node, self.version, i)
2375 fp.write(e)
2376
2377 # the temp file replaces the real index when we exit the context
2378 # manager
2379
2380 tr.replace(self.indexfile, trindex * self._io.size)
2381 self._chunkclear()
2382
2383 def addrevision(self, text, transaction, link, p1, p2, cachedelta=None,
2384 node=None, flags=REVIDX_DEFAULT_FLAGS, deltacomputer=None):
2385 """add a revision to the log
2386
2387 text - the revision data to add
2388 transaction - the transaction object used for rollback
2389 link - the linkrev data to add
2390 p1, p2 - the parent nodeids of the revision
2391 cachedelta - an optional precomputed delta
2392 node - nodeid of revision; typically node is not specified, and it is
2393 computed by default as hash(text, p1, p2), however subclasses might
2394 use different hashing method (and override checkhash() in such case)
2395 flags - the known flags to set on the revision
2396 deltacomputer - an optional _deltacomputer instance shared between
2397 multiple calls
2398 """
2399 if link == nullrev:
2400 raise RevlogError(_("attempted to add linkrev -1 to %s")
2401 % self.indexfile)
2402
2403 if flags:
2404 node = node or self.hash(text, p1, p2)
2405
2406 rawtext, validatehash = self._processflags(text, flags, 'write')
2407
2408 # If the flag processor modifies the revision data, ignore any provided
2409 # cachedelta.
2410 if rawtext != text:
2411 cachedelta = None
2412
2413 if len(rawtext) > _maxentrysize:
2414 raise RevlogError(
2415 _("%s: size of %d bytes exceeds maximum revlog storage of 2GiB")
2416 % (self.indexfile, len(rawtext)))
2417
2418 node = node or self.hash(rawtext, p1, p2)
2419 if node in self.nodemap:
2420 return node
2421
2422 if validatehash:
2423 self.checkhash(rawtext, node, p1=p1, p2=p2)
2424
2425 return self.addrawrevision(rawtext, transaction, link, p1, p2, node,
2426 flags, cachedelta=cachedelta,
2427 deltacomputer=deltacomputer)
2428
2429 def addrawrevision(self, rawtext, transaction, link, p1, p2, node, flags,
2430 cachedelta=None, deltacomputer=None):
2431 """add a raw revision with known flags, node and parents
2432 useful when reusing a revision not stored in this revlog (ex: received
2433 over wire, or read from an external bundle).
2434 """
2435 dfh = None
2436 if not self._inline:
2437 dfh = self._datafp("a+")
2438 ifh = self._indexfp("a+")
2439 try:
2440 return self._addrevision(node, rawtext, transaction, link, p1, p2,
2441 flags, cachedelta, ifh, dfh,
2442 deltacomputer=deltacomputer)
2443 finally:
2444 if dfh:
2445 dfh.close()
2446 ifh.close()
2447
2448 def compress(self, data):
2449 """Generate a possibly-compressed representation of data."""
2450 if not data:
2451 return '', data
2452
2453 compressed = self._compressor.compress(data)
2454
2455 if compressed:
2456 # The revlog compressor added the header in the returned data.
2457 return '', compressed
2458
2459 if data[0:1] == '\0':
2460 return '', data
2461 return 'u', data
2462
2463 def decompress(self, data):
2464 """Decompress a revlog chunk.
2465
2466 The chunk is expected to begin with a header identifying the
2467 format type so it can be routed to an appropriate decompressor.
2468 """
2469 if not data:
2470 return data
2471
2472 # Revlogs are read much more frequently than they are written and many
2473 # chunks only take microseconds to decompress, so performance is
2474 # important here.
2475 #
2476 # We can make a few assumptions about revlogs:
2477 #
2478 # 1) the majority of chunks will be compressed (as opposed to inline
2479 # raw data).
2480 # 2) decompressing *any* data will likely be at least 10x slower than
2481 # returning raw inline data.
2482 # 3) we want to prioritize common and officially supported compression
2483 # engines
2484 #
2485 # It follows that we want to optimize for "decompress compressed data
2486 # when encoded with common and officially supported compression engines"
2487 # case over "raw data" and "data encoded by less common or non-official
2488 # compression engines." That is why we have the inline lookup first
2489 # followed by the compengines lookup.
2490 #
2491 # According to `hg perfrevlogchunks`, this is ~0.5% faster for zlib
2492 # compressed chunks. And this matters for changelog and manifest reads.
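# Header byte meanings: 'x' is zlib-compressed data (zlib streams start
# with 0x78), '\0' is raw data stored as-is (it already starts with a
# NUL), 'u' marks explicitly uncompressed data, and any other byte is
# resolved through the compression engine registry.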
2493 t = data[0:1]
2494
2495 if t == 'x':
2496 try:
2497 return _zlibdecompress(data)
2498 except zlib.error as e:
2499 raise RevlogError(_('revlog decompress error: %s') %
2500 stringutil.forcebytestr(e))
2501 # '\0' is more common than 'u' so it goes first.
2502 elif t == '\0':
2503 return data
2504 elif t == 'u':
2505 return util.buffer(data, 1)
2506
2507 try:
2508 compressor = self._decompressors[t]
2509 except KeyError:
2510 try:
2511 engine = util.compengines.forrevlogheader(t)
2512 compressor = engine.revlogcompressor()
2513 self._decompressors[t] = compressor
2514 except KeyError:
2515 raise RevlogError(_('unknown compression type %r') % t)
2516
2517 return compressor.decompress(data)
2518
2519 def _isgooddeltainfo(self, deltainfo, revinfo):
2520 """Returns True if the given delta is good. Good means that it is within
2521 the disk span, disk size, and chain length bounds that we know to be
2522 performant."""
2523 if deltainfo is None:
2524 return False
2525
2526 # - 'deltainfo.distance' is the distance from the base revision --
2527 # bounding it limits the amount of I/O we need to do.
2528 # - 'deltainfo.compresseddeltalen' is the sum of the total size of
2529 # deltas we need to apply -- bounding it limits the amount of CPU
2530 # we consume.
2531
2532 if self._sparserevlog:
2533 # As sparse-read will be used, we can consider that the distance,
2534 # instead of being the span of the whole chunk,
2535 # is the span of the largest read chunk
2536 base = deltainfo.base
2537
2538 if base != nullrev:
2539 deltachain = self._deltachain(base)[0]
2540 else:
2541 deltachain = []
2542
2543 # search for the first non-snapshot revision
2544 for idx, r in enumerate(deltachain):
2545 if not self.issnapshot(r):
2546 break
2547 deltachain = deltachain[idx:]
2548 chunks = _slicechunk(self, deltachain, deltainfo)
2549 all_span = [_segmentspan(self, revs, deltainfo) for revs in chunks]
2550 distance = max(all_span)
2551 else:
2552 distance = deltainfo.distance
2553
2554 textlen = revinfo.textlen
2555 defaultmax = textlen * 4
2556 maxdist = self._maxdeltachainspan
2557 if not maxdist:
2558 maxdist = distance # ensure the conditional pass
2559 maxdist = max(maxdist, defaultmax)
2560 if self._sparserevlog and maxdist < self._srmingapsize:
2561 # In multiple places, we ignore irrelevant data ranges below a
2562 # certain size. We also apply this tradeoff here and relax the span
2563 # constraint for small enough content.
2564 maxdist = self._srmingapsize
2565
2566 # Bad delta from read span:
2567 #
2568 # If the span of data read is larger than the maximum allowed.
2569 if maxdist < distance:
2570 return False
2571
2572 # Bad delta from new delta size:
2573 #
2574 # If the delta size is larger than the target text, storing the
2575 # delta will be inefficient.
2576 if textlen < deltainfo.deltalen:
2577 return False
2578
2579 # Bad delta from cumulative payload size:
2580 #
2581 # If the sum of the deltas gets larger than K * the target text length.
2582 if textlen * LIMIT_DELTA2TEXT < deltainfo.compresseddeltalen:
2583 return False
2584
2585 # Bad delta from chain length:
2586 #
2587 # If the number of deltas in the chain gets too high.
2588 if self._maxchainlen and self._maxchainlen < deltainfo.chainlen:
2589 return False
2590
2591 # bad delta from intermediate snapshot size limit
2592 #
2593 # If an intermediate snapshot's size is higher than the limit. The
2594 # limit exists to prevent endless chains of intermediate deltas from
2595 # being created.
2596 if (deltainfo.snapshotdepth is not None and
2597 (textlen >> deltainfo.snapshotdepth) < deltainfo.deltalen):
2598 return False
2599
2600 # bad delta if new intermediate snapshot is larger than the previous
2601 # snapshot
2602 if (deltainfo.snapshotdepth
2603 and self.length(deltainfo.base) < deltainfo.deltalen):
2604 return False
2605
2606 return True
2607
2608 def _addrevision(self, node, rawtext, transaction, link, p1, p2, flags,
2609 cachedelta, ifh, dfh, alwayscache=False,
2610 deltacomputer=None):
2611 """internal function to add revisions to the log
2612
2613 see addrevision for argument descriptions.
2614
2615 note: "addrevision" takes non-raw text, "_addrevision" takes raw text.
2616
2617 if "deltacomputer" is not provided or None, a defaultdeltacomputer will
2618 be used.
2619
2620 invariants:
2621 - rawtext is optional (can be None); if not set, cachedelta must be set.
2622 if both are set, they must correspond to each other.
2623 """
2624 if node == nullid:
2625 raise RevlogError(_("%s: attempt to add null revision") %
2626 (self.indexfile))
2627 if node == wdirid or node in wdirfilenodeids:
2628 raise RevlogError(_("%s: attempt to add wdir revision") %
2629 (self.indexfile))
2630
2631 if self._inline:
2632 fh = ifh
2633 else:
2634 fh = dfh
2635
2636 btext = [rawtext]
2637
2638 curr = len(self)
2639 prev = curr - 1
2640 offset = self.end(prev)
2641 p1r, p2r = self.rev(p1), self.rev(p2)
2642
2643 # full versions are inserted when the needed deltas
2644 # become comparable to the uncompressed text
2645 if rawtext is None:
2646 # need the rawtext size before it is changed by flag processors, which is
2647 # the non-raw size. use revlog explicitly to avoid filelog's extra
2648 # logic that might remove metadata size.
2649 textlen = mdiff.patchedsize(revlog.size(self, cachedelta[0]),
2650 cachedelta[1])
2651 else:
2652 textlen = len(rawtext)
2653
2654 if deltacomputer is None:
2655 deltacomputer = _deltacomputer(self)
2656
2657 revinfo = _revisioninfo(node, p1, p2, btext, textlen, cachedelta, flags)
2658
2659 # no delta for flag processor revision (see "candelta" for why)
2660 # not calling candelta since only one revision needs testing, also to
2661 # avoid the overhead of fetching flags again.
2662 if flags & REVIDX_RAWTEXT_CHANGING_FLAGS:
2663 deltainfo = None
2664 else:
2665 deltainfo = deltacomputer.finddeltainfo(revinfo, fh)
2666
2667 if deltainfo is not None:
2668 base = deltainfo.base
2669 chainbase = deltainfo.chainbase
2670 data = deltainfo.data
2671 l = deltainfo.deltalen
2672 else:
2673 rawtext = deltacomputer.buildtext(revinfo, fh)
2674 data = self.compress(rawtext)
2675 l = len(data[1]) + len(data[0])
2676 base = chainbase = curr
2677
2678 e = (offset_type(offset, flags), l, textlen,
2679 base, link, p1r, p2r, node)
2680 self.index.append(e)
2681 self.nodemap[node] = curr
2682
2683 entry = self._io.packentry(e, self.node, self.version, curr)
2684 self._writeentry(transaction, ifh, dfh, entry, data, link, offset)
2685
2686 if alwayscache and rawtext is None:
2687 rawtext = deltacomputer.buildtext(revinfo, fh)
2688
2689 if type(rawtext) == bytes: # only accept immutable objects
2690 self._cache = (node, curr, rawtext)
2691 self._chainbasecache[curr] = chainbase
2692 return node
2693
2694 def _writeentry(self, transaction, ifh, dfh, entry, data, link, offset):
2695 # Files opened in a+ mode have inconsistent behavior on various
2696 # platforms. Windows requires that a file positioning call be made
2697 # when the file handle transitions between reads and writes. See
2698 # 3686fa2b8eee and the mixedfilemodewrapper in windows.py. On other
2699 # platforms, Python or the platform itself can be buggy. Some versions
2700 # of Solaris have been observed to not append at the end of the file
2701 # if the file was seeked to before the end. See issue4943 for more.
2702 #
2703 # We work around this issue by inserting a seek() before writing.
2704 # Note: This is likely not necessary on Python 3.
2705 ifh.seek(0, os.SEEK_END)
2706 if dfh:
2707 dfh.seek(0, os.SEEK_END)
2708
2709 curr = len(self) - 1
2710 if not self._inline:
2711 transaction.add(self.datafile, offset)
2712 transaction.add(self.indexfile, curr * len(entry))
2713 if data[0]:
2714 dfh.write(data[0])
2715 dfh.write(data[1])
2716 ifh.write(entry)
2717 else:
2718 offset += curr * self._io.size
2719 transaction.add(self.indexfile, offset, curr)
2720 ifh.write(entry)
2721 ifh.write(data[0])
2722 ifh.write(data[1])
2723 self._enforceinlinesize(transaction, ifh)
2724
2725 def addgroup(self, deltas, linkmapper, transaction, addrevisioncb=None):
2726 """
2727 add a delta group
2728
2729 given a set of deltas, add them to the revision log. the
2730 first delta is against its parent, which should be in our
2731 log, the rest are against the previous delta.
2732
2733 If ``addrevisioncb`` is defined, it will be called with arguments of
2734 this revlog and the node that was added.
2735 """
2736
2737 nodes = []
2738
2739 r = len(self)
2740 end = 0
2741 if r:
2742 end = self.end(r - 1)
2743 ifh = self._indexfp("a+")
2744 isize = r * self._io.size
2745 if self._inline:
2746 transaction.add(self.indexfile, end + isize, r)
2747 dfh = None
2748 else:
2749 transaction.add(self.indexfile, isize, r)
2750 transaction.add(self.datafile, end)
2751 dfh = self._datafp("a+")
2752 def flush():
2753 if dfh:
2754 dfh.flush()
2755 ifh.flush()
2756 try:
2757 deltacomputer = _deltacomputer(self)
2758 # loop through our set of deltas
2759 for data in deltas:
2760 node, p1, p2, linknode, deltabase, delta, flags = data
2761 link = linkmapper(linknode)
2762 flags = flags or REVIDX_DEFAULT_FLAGS
2763
2764 nodes.append(node)
2765
2766 if node in self.nodemap:
2767 # this can happen if two branches make the same change
2768 continue
2769
2770 for p in (p1, p2):
2771 if p not in self.nodemap:
2772 raise LookupError(p, self.indexfile,
2773 _('unknown parent'))
2774
2775 if deltabase not in self.nodemap:
2776 raise LookupError(deltabase, self.indexfile,
2777 _('unknown delta base'))
2778
2779 baserev = self.rev(deltabase)
2780
2781 if baserev != nullrev and self.iscensored(baserev):
2782 # if base is censored, delta must be full replacement in a
2783 # single patch operation
2784 hlen = struct.calcsize(">lll")
2785 oldlen = self.rawsize(baserev)
2786 newlen = len(delta) - hlen
2787 if delta[:hlen] != mdiff.replacediffheader(oldlen, newlen):
2788 raise error.CensoredBaseError(self.indexfile,
2789 self.node(baserev))
2790
2791 if not flags and self._peek_iscensored(baserev, delta, flush):
2792 flags |= REVIDX_ISCENSORED
2793
2794 # We assume consumers of addrevisioncb will want to retrieve
2795 # the added revision, which will require a call to
2796 # revision(). revision() will fast path if there is a cache
2797 # hit. So, we tell _addrevision() to always cache in this case.
2798 # We're only using addgroup() in the context of changegroup
2799 # generation so the revision data can always be handled as raw
2800 # by the flagprocessor.
2801 self._addrevision(node, None, transaction, link,
2802 p1, p2, flags, (baserev, delta),
2803 ifh, dfh,
2804 alwayscache=bool(addrevisioncb),
2805 deltacomputer=deltacomputer)
2806
2807 if addrevisioncb:
2808 addrevisioncb(self, node)
2809
2810 if not dfh and not self._inline:
2811 # addrevision switched from inline to conventional
2812 # reopen the index
2813 ifh.close()
2814 dfh = self._datafp("a+")
2815 ifh = self._indexfp("a+")
2816 finally:
2817 if dfh:
2818 dfh.close()
2819 ifh.close()
2820
2821 return nodes
2822
2823 def iscensored(self, rev):
2824 """Check if a file revision is censored."""
2825 if not self._censorable:
2826 return False
2827
2828 return self.flags(rev) & REVIDX_ISCENSORED
2829
2830 def _peek_iscensored(self, baserev, delta, flush):
2831 """Quickly check if a delta produces a censored revision."""
2832 if not self._censorable:
2833 return False
2834
2835 # Fragile heuristic: unless new file meta keys are added alphabetically
2836 # preceding "censored", all censored revisions are prefixed by
2837 # "\1\ncensored:". A delta producing such a censored revision must be a
2838 # full-replacement delta, so we inspect the first and only patch in the
2839 # delta for this prefix.
2840 hlen = struct.calcsize(">lll")
2841 if len(delta) <= hlen:
2842 return False
2843
2844 oldlen = self.rawsize(baserev)
2845 newlen = len(delta) - hlen
2846 if delta[:hlen] != mdiff.replacediffheader(oldlen, newlen):
2847 return False
2848
2849 add = "\1\ncensored:"
2850 addlen = len(add)
2851 return newlen >= addlen and delta[hlen:hlen + addlen] == add
2852
2853 def getstrippoint(self, minlink):
2854 """find the minimum rev that must be stripped to strip the linkrev
2855
2856 Returns a tuple containing the minimum rev and a set of all revs that
2857 have linkrevs that will be broken by this strip.
2858 """
2859 brokenrevs = set()
2860 strippoint = len(self)
2861
2862 heads = {}
2863 futurelargelinkrevs = set()
2864 for head in self.headrevs():
2865 headlinkrev = self.linkrev(head)
2866 heads[head] = headlinkrev
2867 if headlinkrev >= minlink:
2868 futurelargelinkrevs.add(headlinkrev)
2869
2870 # This algorithm involves walking down the rev graph, starting at the
2871 # heads. Since the revs are topologically sorted according to linkrev,
2872 # once all head linkrevs are below the minlink, we know there are
2873 # no more revs that could have a linkrev greater than minlink.
2874 # So we can stop walking.
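# For example, in a linear revlog of four revisions whose linkrevs equal
# their revs, getstrippoint(2) walks down from the head, pops revs 3 and 2
# (their linkrevs are >= 2, so nothing is "broken") and stops once no
# pending head carries a linkrev >= 2, returning (2, set()).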
2875 while futurelargelinkrevs:
2876 strippoint -= 1
2877 linkrev = heads.pop(strippoint)
2878
2879 if linkrev < minlink:
2880 brokenrevs.add(strippoint)
2881 else:
2882 futurelargelinkrevs.remove(linkrev)
2883
2884 for p in self.parentrevs(strippoint):
2885 if p != nullrev:
2886 plinkrev = self.linkrev(p)
2887 heads[p] = plinkrev
2888 if plinkrev >= minlink:
2889 futurelargelinkrevs.add(plinkrev)
2890
2891 return strippoint, brokenrevs
2892
2893 def strip(self, minlink, transaction):
2894 """truncate the revlog on the first revision with a linkrev >= minlink
2895
2896 This function is called when we're stripping revision minlink and
2897 its descendants from the repository.
2898
2899 We have to remove all revisions with linkrev >= minlink, because
2900 the equivalent changelog revisions will be renumbered after the
2901 strip.
2902
2903 So we truncate the revlog on the first of these revisions, and
2904 trust that the caller has saved the revisions that shouldn't be
2905 removed and that it'll re-add them after this truncation.
2906 """
2907 if len(self) == 0:
2908 return
2909
2910 rev, _ = self.getstrippoint(minlink)
2911 if rev == len(self):
2912 return
2913
2914 # first truncate the files on disk
2915 end = self.start(rev)
2916 if not self._inline:
2917 transaction.add(self.datafile, end)
2918 end = rev * self._io.size
2919 else:
2920 end += rev * self._io.size
2921
2922 transaction.add(self.indexfile, end)
2923
2924 # then reset internal state in memory to forget those revisions
2925 self._cache = None
2926 self._chaininfocache = {}
2927 self._chunkclear()
2928 for x in pycompat.xrange(rev, len(self)):
2929 del self.nodemap[self.node(x)]
2930
2931 del self.index[rev:-1]
2932 self._nodepos = None
2933
2934 def checksize(self):
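# Compare the on-disk file sizes with what the index describes and return
# (data excess, index excess): the number of unexpected trailing bytes in
# the data file and the index file. Missing files count as empty, and for
# inline revlogs the combined file is reported through the second value.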
2935 expected = 0
2936 if len(self):
2937 expected = max(0, self.end(len(self) - 1))
2938
2939 try:
2940 with self._datafp() as f:
2941 f.seek(0, 2)
2942 actual = f.tell()
2943 dd = actual - expected
2944 except IOError as inst:
2945 if inst.errno != errno.ENOENT:
2946 raise
2947 dd = 0
2948
2949 try:
2950 f = self.opener(self.indexfile)
2951 f.seek(0, 2)
2952 actual = f.tell()
2953 f.close()
2954 s = self._io.size
2955 i = max(0, actual // s)
2956 di = actual - (i * s)
2957 if self._inline:
2958 databytes = 0
2959 for r in self:
2960 databytes += max(0, self.length(r))
2961 dd = 0
2962 di = actual - len(self) * s - databytes
2963 except IOError as inst:
2964 if inst.errno != errno.ENOENT:
2965 raise
2966 di = 0
2967
2968 return (dd, di)
2969
2970 def files(self):
2971 res = [self.indexfile]
2972 if not self._inline:
2973 res.append(self.datafile)
2974 return res
2975
2976 def emitrevisiondeltas(self, requests):
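# For each requested node this picks a delta base (honouring an explicit
# basenode, otherwise falling back to the stored delta parent or the
# previously emitted revision) and yields a revlogrevisiondelta carrying
# either a delta or, when no usable base exists or censorship is
# involved, the full raw revision.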
2977 frev = self.rev
2978
2979 prevrev = None
2980 for request in requests:
2981 node = request.node
2982 rev = frev(node)
2983
2984 if prevrev is None:
2985 prevrev = self.index[rev][5]
2986
2987 # Requesting a full revision.
2988 if request.basenode == nullid:
2989 baserev = nullrev
2990 # Requesting an explicit revision.
2991 elif request.basenode is not None:
2992 baserev = frev(request.basenode)
2993 # Allowing us to choose.
2994 else:
2995 p1rev, p2rev = self.parentrevs(rev)
2996 deltaparentrev = self.deltaparent(rev)
2997
2998 # Avoid sending full revisions when delta parent is null. Pick
2999 # prev in that case. It's tempting to pick p1 in this case, as
3000 # p1 will be smaller in the common case. However, computing a
3001 # delta against p1 may require resolving the raw text of p1,
3002 # which could be expensive. The revlog caches should have prev
3003 # cached, meaning less CPU for delta generation. There is
3004 # likely room to add a flag and/or config option to control this
3005 # behavior.
3006 if deltaparentrev == nullrev and self._storedeltachains:
3007 baserev = prevrev
3008
3009 # Revlog is configured to use full snapshot for a reason.
3010 # Stick to full snapshot.
3011 elif deltaparentrev == nullrev:
3012 baserev = nullrev
3013
3014 # Pick previous when we can't be sure the base is available
3015 # on consumer.
3016 elif deltaparentrev not in (p1rev, p2rev, prevrev):
3017 baserev = prevrev
3018 else:
3019 baserev = deltaparentrev
3020
3021 if baserev != nullrev and not self.candelta(baserev, rev):
3022 baserev = nullrev
3023
3024 revision = None
3025 delta = None
3026 baserevisionsize = None
3027
3028 if self.iscensored(baserev) or self.iscensored(rev):
3029 try:
3030 revision = self.revision(node, raw=True)
3031 except error.CensoredNodeError as e:
3032 revision = e.tombstone
3033
3034 if baserev != nullrev:
3035 baserevisionsize = self.rawsize(baserev)
3036
3037 elif baserev == nullrev:
3038 revision = self.revision(node, raw=True)
3039 else:
3040 delta = self.revdiff(baserev, rev)
3041
3042 extraflags = REVIDX_ELLIPSIS if request.ellipsis else 0
3043
3044 yield revlogrevisiondelta(
3045 node=node,
3046 p1node=request.p1node,
3047 p2node=request.p2node,
3048 linknode=request.linknode,
3049 basenode=self.node(baserev),
3050 flags=self.flags(rev) | extraflags,
3051 baserevisionsize=baserevisionsize,
3052 revision=revision,
3053 delta=delta)
3054
3055 prevrev = rev
3056
3057 DELTAREUSEALWAYS = 'always'
3058 DELTAREUSESAMEREVS = 'samerevs'
3059 DELTAREUSENEVER = 'never'
3060
3061 DELTAREUSEFULLADD = 'fulladd'
3062
3063 DELTAREUSEALL = {'always', 'samerevs', 'never', 'fulladd'}
3064
3065 def clone(self, tr, destrevlog, addrevisioncb=None,
3066 deltareuse=DELTAREUSESAMEREVS, deltabothparents=None):
3067 """Copy this revlog to another, possibly with format changes.
3068
3069 The destination revlog will contain the same revisions and nodes.
3070 However, it may not be bit-for-bit identical due to e.g. delta encoding
3071 differences.
3072
3073 The ``deltareuse`` argument controls how deltas from the existing revlog
3074 are preserved in the destination revlog. The argument can have the
3075 following values:
3076
3077 DELTAREUSEALWAYS
3078 Deltas will always be reused (if possible), even if the destination
3079 revlog would not select the same revisions for the delta. This is the
3080 fastest mode of operation.
3081 DELTAREUSESAMEREVS
3082 Deltas will be reused if the destination revlog would pick the same
3083 revisions for the delta. This mode strikes a balance between speed
3084 and optimization.
3085 DELTAREUSENEVER
3086 Deltas will never be reused. This is the slowest mode of execution.
3087 This mode can be used to recompute deltas (e.g. if the diff/delta
3088 algorithm changes).
3089
3090 Delta computation can be slow, so the choice of delta reuse policy can
3091 significantly affect run time.
3092
3093 The default policy (``DELTAREUSESAMEREVS``) strikes a balance between
3094 two extremes. Deltas will be reused if they are appropriate. But if a
3095 better base revision would be chosen for the delta, it is used. This means if you
3096 are converting a non-generaldelta revlog to a generaldelta revlog,
3097 deltas will be recomputed if the delta's parent isn't a parent of the
3098 revision.
3099
3100 In addition to the delta policy, the ``deltabothparents`` argument
3101 controls whether to compute deltas against both parents for merges.
3102 If it is not set, the destination revlog's existing setting is kept.
3103 """
3104 if deltareuse not in self.DELTAREUSEALL:
3105 raise ValueError(_('value for deltareuse invalid: %s') % deltareuse)
3106
3107 if len(destrevlog):
3108 raise ValueError(_('destination revlog is not empty'))
3109
3110 if getattr(self, 'filteredrevs', None):
3111 raise ValueError(_('source revlog has filtered revisions'))
3112 if getattr(destrevlog, 'filteredrevs', None):
3113 raise ValueError(_('destination revlog has filtered revisions'))
3114
3115 # lazydeltabase controls whether to reuse a cached delta, if possible.
3116 oldlazydeltabase = destrevlog._lazydeltabase
3117 oldamd = destrevlog._deltabothparents
3118
3119 try:
3120 if deltareuse == self.DELTAREUSEALWAYS:
3121 destrevlog._lazydeltabase = True
3122 elif deltareuse == self.DELTAREUSESAMEREVS:
3123 destrevlog._lazydeltabase = False
3124
3125 destrevlog._deltabothparents = deltabothparents or oldamd
3126
3127 populatecachedelta = deltareuse in (self.DELTAREUSEALWAYS,
3128 self.DELTAREUSESAMEREVS)
3129
3130 deltacomputer = _deltacomputer(destrevlog)
3131 index = self.index
3132 for rev in self:
3133 entry = index[rev]
3134
3135 # Some classes override linkrev to take filtered revs into
3136 # account. Use raw entry from index.
3137 flags = entry[0] & 0xffff
3138 linkrev = entry[4]
3139 p1 = index[entry[5]][7]
3140 p2 = index[entry[6]][7]
3141 node = entry[7]
3142
3143 # (Possibly) reuse the delta from the revlog if allowed and
3144 # the revlog chunk is a delta.
3145 cachedelta = None
3146 rawtext = None
3147 if populatecachedelta:
3148 dp = self.deltaparent(rev)
3149 if dp != nullrev:
3150 cachedelta = (dp, bytes(self._chunk(rev)))
3151
3152 if not cachedelta:
3153 rawtext = self.revision(rev, raw=True)
3154
3155
3156 if deltareuse == self.DELTAREUSEFULLADD:
3157 destrevlog.addrevision(rawtext, tr, linkrev, p1, p2,
3158 cachedelta=cachedelta,
3159 node=node, flags=flags,
3160 deltacomputer=deltacomputer)
3161 else:
3162 ifh = destrevlog.opener(destrevlog.indexfile, 'a+',
3163 checkambig=False)
3164 dfh = None
3165 if not destrevlog._inline:
3166 dfh = destrevlog.opener(destrevlog.datafile, 'a+')
3167 try:
3168 destrevlog._addrevision(node, rawtext, tr, linkrev, p1,
3169 p2, flags, cachedelta, ifh, dfh,
3170 deltacomputer=deltacomputer)
3171 finally:
3172 if dfh:
3173 dfh.close()
3174 ifh.close()
3175
3176 if addrevisioncb:
3177 addrevisioncb(self, rev, node)
3178 finally:
3179 destrevlog._lazydeltabase = oldlazydeltabase
3180 destrevlog._deltabothparents = oldamd