branchmap: make branchcache responsible for reading...
Martijn Pieters - r41706:bf7fb97a default
@@ -1,2761 +1,2772 @@
1 1 # perf.py - performance test routines
2 2 '''helper extension to measure performance'''
3 3
4 4 # "historical portability" policy of perf.py:
5 5 #
6 6 # We have to do:
7 7 # - make perf.py "loadable" with as wide Mercurial version as possible
8 8 # This doesn't mean that perf commands work correctly with that Mercurial.
9 9 # BTW, perf.py itself has been available since 1.1 (or eb240755386d).
10 10 # - make historical perf command work correctly with as wide Mercurial
11 11 # version as possible
12 12 #
13 13 # We have to do, if possible with reasonable cost:
14 14 # - make recent perf command for historical feature work correctly
15 15 # with early Mercurial
16 16 #
17 17 # We don't have to do:
18 18 # - make perf command for recent feature work correctly with early
19 19 # Mercurial
20 20
21 21 from __future__ import absolute_import
22 22 import contextlib
23 23 import functools
24 24 import gc
25 25 import os
26 26 import random
27 27 import shutil
28 28 import struct
29 29 import sys
30 30 import tempfile
31 31 import threading
32 32 import time
33 33 from mercurial import (
34 34 changegroup,
35 35 cmdutil,
36 36 commands,
37 37 copies,
38 38 error,
39 39 extensions,
40 40 hg,
41 41 mdiff,
42 42 merge,
43 43 revlog,
44 44 util,
45 45 )
46 46
47 47 # for "historical portability":
48 48 # try to import modules separately (in dict order), and ignore
49 49 # failure, because these aren't available with early Mercurial
50 50 try:
51 51 from mercurial import branchmap # since 2.5 (or bcee63733aad)
52 52 except ImportError:
53 53 pass
54 54 try:
55 55 from mercurial import obsolete # since 2.3 (or ad0d6c2b3279)
56 56 except ImportError:
57 57 pass
58 58 try:
59 59 from mercurial import registrar # since 3.7 (or 37d50250b696)
60 60 dir(registrar) # forcibly load it
61 61 except ImportError:
62 62 registrar = None
63 63 try:
64 64 from mercurial import repoview # since 2.5 (or 3a6ddacb7198)
65 65 except ImportError:
66 66 pass
67 67 try:
68 68 from mercurial import scmutil # since 1.9 (or 8b252e826c68)
69 69 except ImportError:
70 70 pass
71 71 try:
72 72 from mercurial import setdiscovery # since 1.9 (or cb98fed52495)
73 73 except ImportError:
74 74 pass
75 75
76 76
77 77 def identity(a):
78 78 return a
79 79
80 80 try:
81 81 from mercurial import pycompat
82 82 getargspec = pycompat.getargspec # added to module after 4.5
83 83 _byteskwargs = pycompat.byteskwargs # since 4.1 (or fbc3f73dc802)
84 84 _sysstr = pycompat.sysstr # since 4.0 (or 2219f4f82ede)
85 85 _xrange = pycompat.xrange # since 4.8 (or 7eba8f83129b)
86 86 fsencode = pycompat.fsencode # since 3.9 (or f4a5e0e86a7e)
87 87 if pycompat.ispy3:
88 88 _maxint = sys.maxsize # per py3 docs for replacing maxint
89 89 else:
90 90 _maxint = sys.maxint
91 91 except (ImportError, AttributeError):
92 92 import inspect
93 93 getargspec = inspect.getargspec
94 94 _byteskwargs = identity
95 95 fsencode = identity # no py3 support
96 96 _maxint = sys.maxint # no py3 support
97 97 _sysstr = lambda x: x # no py3 support
98 98 _xrange = xrange
99 99
100 100 try:
101 101 # 4.7+
102 102 queue = pycompat.queue.Queue
103 103 except (AttributeError, ImportError):
104 104 # <4.7.
105 105 try:
106 106 queue = pycompat.queue
107 107 except (AttributeError, ImportError):
108 108 queue = util.queue
109 109
110 110 try:
111 111 from mercurial import logcmdutil
112 112 makelogtemplater = logcmdutil.maketemplater
113 113 except (AttributeError, ImportError):
114 114 try:
115 115 makelogtemplater = cmdutil.makelogtemplater
116 116 except (AttributeError, ImportError):
117 117 makelogtemplater = None
118 118
119 119 # for "historical portability":
120 120 # define util.safehasattr forcibly, because util.safehasattr has been
121 121 # available since 1.9.3 (or 94b200a11cf7)
122 122 _undefined = object()
123 123 def safehasattr(thing, attr):
124 124 return getattr(thing, _sysstr(attr), _undefined) is not _undefined
125 125 setattr(util, 'safehasattr', safehasattr)
126 126
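# A minimal usage sketch of safehasattr(); the attribute probed here is
# one this file really checks later (see repocleartagscachefunc below):
#
#   if safehasattr(repo, b'_tagscache'):
#       ...  # the modern tags cache is present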
127 127 # for "historical portability":
128 128 # define util.timer forcibly, because util.timer has been available
129 129 # since ae5d60bb70c9
130 130 if safehasattr(time, 'perf_counter'):
131 131 util.timer = time.perf_counter
132 132 elif os.name == r'nt':
133 133 util.timer = time.clock
134 134 else:
135 135 util.timer = time.time
136 136
137 137 # for "historical portability":
138 138 # use locally defined empty option list, if formatteropts isn't
139 139 # available, because commands.formatteropts has been available since
140 140 # 3.2 (or 7a7eed5176a4), even though formatting itself has been
141 141 # available since 2.2 (or ae5f92e154d3)
142 142 formatteropts = getattr(cmdutil, "formatteropts",
143 143 getattr(commands, "formatteropts", []))
144 144
145 145 # for "historical portability":
146 146 # use locally defined option list, if debugrevlogopts isn't available,
147 147 # because commands.debugrevlogopts has been available since 3.7 (or
148 148 # 5606f7d0d063), even though cmdutil.openrevlog() has been available
149 149 # since 1.9 (or a79fea6b3e77).
150 150 revlogopts = getattr(cmdutil, "debugrevlogopts",
151 151 getattr(commands, "debugrevlogopts", [
152 152 (b'c', b'changelog', False, (b'open changelog')),
153 153 (b'm', b'manifest', False, (b'open manifest')),
154 154 (b'', b'dir', False, (b'open directory manifest')),
155 155 ]))
156 156
157 157 cmdtable = {}
158 158
159 159 # for "historical portability":
160 160 # define parsealiases locally, because cmdutil.parsealiases has been
161 161 # available since 1.5 (or 6252852b4332)
162 162 def parsealiases(cmd):
163 163 return cmd.split(b"|")
164 164
165 165 if safehasattr(registrar, 'command'):
166 166 command = registrar.command(cmdtable)
167 167 elif safehasattr(cmdutil, 'command'):
168 168 command = cmdutil.command(cmdtable)
169 169 if b'norepo' not in getargspec(command).args:
170 170 # for "historical portability":
171 171 # wrap original cmdutil.command, because "norepo" option has
172 172 # been available since 3.1 (or 75a96326cecb)
173 173 _command = command
174 174 def command(name, options=(), synopsis=None, norepo=False):
175 175 if norepo:
176 176 commands.norepo += b' %s' % b' '.join(parsealiases(name))
177 177 return _command(name, list(options), synopsis)
178 178 else:
179 179 # for "historical portability":
180 180 # define "@command" annotation locally, because cmdutil.command
181 181 # has been available since 1.9 (or 2daa5179e73f)
182 182 def command(name, options=(), synopsis=None, norepo=False):
183 183 def decorator(func):
184 184 if synopsis:
185 185 cmdtable[name] = func, list(options), synopsis
186 186 else:
187 187 cmdtable[name] = func, list(options)
188 188 if norepo:
189 189 commands.norepo += b' %s' % b' '.join(parsealiases(name))
190 190 return func
191 191 return decorator
192 192
193 193 try:
194 194 import mercurial.registrar
195 195 import mercurial.configitems
196 196 configtable = {}
197 197 configitem = mercurial.registrar.configitem(configtable)
198 198 configitem(b'perf', b'presleep',
199 199 default=mercurial.configitems.dynamicdefault,
200 200 )
201 201 configitem(b'perf', b'stub',
202 202 default=mercurial.configitems.dynamicdefault,
203 203 )
204 204 configitem(b'perf', b'parentscount',
205 205 default=mercurial.configitems.dynamicdefault,
206 206 )
207 207 configitem(b'perf', b'all-timing',
208 208 default=mercurial.configitems.dynamicdefault,
209 209 )
210 210 except (ImportError, AttributeError):
211 211 pass
212 212
213 213 def getlen(ui):
214 214 if ui.configbool(b"perf", b"stub", False):
215 215 return lambda x: 1
216 216 return len
217 217
218 218 def gettimer(ui, opts=None):
219 219 """return a timer function and formatter: (timer, formatter)
220 220
221 221 This function exists to gather the creation of formatter in a single
222 222 place instead of duplicating it in all performance commands."""
223 223
224 224 # enforce an idle period before execution to counteract power management
225 225 # experimental config: perf.presleep
226 226 time.sleep(getint(ui, b"perf", b"presleep", 1))
227 227
228 228 if opts is None:
229 229 opts = {}
230 230 # redirect all to stderr unless buffer api is in use
231 231 if not ui._buffers:
232 232 ui = ui.copy()
233 233 uifout = safeattrsetter(ui, b'fout', ignoremissing=True)
234 234 if uifout:
235 235 # for "historical portability":
236 236 # ui.fout/ferr have been available since 1.9 (or 4e1ccd4c2b6d)
237 237 uifout.set(ui.ferr)
238 238
239 239 # get a formatter
240 240 uiformatter = getattr(ui, 'formatter', None)
241 241 if uiformatter:
242 242 fm = uiformatter(b'perf', opts)
243 243 else:
244 244 # for "historical portability":
245 245 # define formatter locally, because ui.formatter has been
246 246 # available since 2.2 (or ae5f92e154d3)
247 247 from mercurial import node
248 248 class defaultformatter(object):
249 249 """Minimized composition of baseformatter and plainformatter
250 250 """
251 251 def __init__(self, ui, topic, opts):
252 252 self._ui = ui
253 253 if ui.debugflag:
254 254 self.hexfunc = node.hex
255 255 else:
256 256 self.hexfunc = node.short
257 257 def __nonzero__(self):
258 258 return False
259 259 __bool__ = __nonzero__
260 260 def startitem(self):
261 261 pass
262 262 def data(self, **data):
263 263 pass
264 264 def write(self, fields, deftext, *fielddata, **opts):
265 265 self._ui.write(deftext % fielddata, **opts)
266 266 def condwrite(self, cond, fields, deftext, *fielddata, **opts):
267 267 if cond:
268 268 self._ui.write(deftext % fielddata, **opts)
269 269 def plain(self, text, **opts):
270 270 self._ui.write(text, **opts)
271 271 def end(self):
272 272 pass
273 273 fm = defaultformatter(ui, b'perf', opts)
274 274
275 275 # stub function, runs code only once instead of in a loop
276 276 # experimental config: perf.stub
277 277 if ui.configbool(b"perf", b"stub", False):
278 278 return functools.partial(stub_timer, fm), fm
279 279
280 280 # experimental config: perf.all-timing
281 281 displayall = ui.configbool(b"perf", b"all-timing", False)
282 282 return functools.partial(_timer, fm, displayall=displayall), fm
283 283
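# A minimal sketch (the command name 'perfexample' is hypothetical) of
# how gettimer() is consumed by the perf commands below: the returned
# timer re-runs the benchmark body per the sampling policy in _timer(),
# and the formatter must be closed with fm.end():
#
#   @command(b'perfexample', formatteropts)
#   def perfexample(ui, repo, **opts):
#       opts = _byteskwargs(opts)
#       timer, fm = gettimer(ui, opts)
#       timer(lambda: len(repo.changelog))
#       fm.end()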
284 284 def stub_timer(fm, func, setup=None, title=None):
285 285 if setup is not None:
286 286 setup()
287 287 func()
288 288
289 289 @contextlib.contextmanager
290 290 def timeone():
291 291 r = []
292 292 ostart = os.times()
293 293 cstart = util.timer()
294 294 yield r
295 295 cstop = util.timer()
296 296 ostop = os.times()
297 297 a, b = ostart, ostop
298 298 r.append((cstop - cstart, b[0] - a[0], b[1] - a[1]))
299 299
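# Each sample appended by timeone() is a 3-tuple of deltas: wall clock
# time from util.timer(), user CPU time from os.times()[0], and system
# CPU time from os.times()[1]. _timer() below collects these samples and
# formatone() renders them as the wall/comb/user/sys columns.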
300 300 def _timer(fm, func, setup=None, title=None, displayall=False):
301 301 gc.collect()
302 302 results = []
303 303 begin = util.timer()
304 304 count = 0
305 305 while True:
306 306 if setup is not None:
307 307 setup()
308 308 with timeone() as item:
309 309 r = func()
310 310 count += 1
311 311 results.append(item[0])
312 312 cstop = util.timer()
313 313 if cstop - begin > 3 and count >= 100:
314 314 break
315 315 if cstop - begin > 10 and count >= 3:
316 316 break
317 317
318 318 formatone(fm, results, title=title, result=r,
319 319 displayall=displayall)
320 320
321 321 def formatone(fm, timings, title=None, result=None, displayall=False):
322 322
323 323 count = len(timings)
324 324
325 325 fm.startitem()
326 326
327 327 if title:
328 328 fm.write(b'title', b'! %s\n', title)
329 329 if result:
330 330 fm.write(b'result', b'! result: %s\n', result)
331 331 def display(role, entry):
332 332 prefix = b''
333 333 if role != b'best':
334 334 prefix = b'%s.' % role
335 335 fm.plain(b'!')
336 336 fm.write(prefix + b'wall', b' wall %f', entry[0])
337 337 fm.write(prefix + b'comb', b' comb %f', entry[1] + entry[2])
338 338 fm.write(prefix + b'user', b' user %f', entry[1])
339 339 fm.write(prefix + b'sys', b' sys %f', entry[2])
340 340 fm.write(prefix + b'count', b' (%s of %%d)' % role, count)
341 341 fm.plain(b'\n')
342 342 timings.sort()
343 343 min_val = timings[0]
344 344 display(b'best', min_val)
345 345 if displayall:
346 346 max_val = timings[-1]
347 347 display(b'max', max_val)
348 348 avg = tuple([sum(x) / count for x in zip(*timings)])
349 349 display(b'avg', avg)
350 350 median = timings[len(timings) // 2]
351 351 display(b'median', median)
352 352
353 353 # utilities for historical portability
354 354
355 355 def getint(ui, section, name, default):
356 356 # for "historical portability":
357 357 # ui.configint has been available since 1.9 (or fa2b596db182)
358 358 v = ui.config(section, name, None)
359 359 if v is None:
360 360 return default
361 361 try:
362 362 return int(v)
363 363 except ValueError:
364 364 raise error.ConfigError((b"%s.%s is not an integer ('%s')")
365 365 % (section, name, v))
366 366
367 367 def safeattrsetter(obj, name, ignoremissing=False):
368 368 """Ensure that 'obj' has 'name' attribute before subsequent setattr
369 369
370 370 This function aborts if 'obj' doesn't have the 'name' attribute
371 371 at runtime. This avoids overlooking future removal of an attribute,
372 372 which would silently break the performance measurement's assumptions.
373 373
374 374 This function returns an object that can (1) assign a new value to,
375 375 and (2) restore the original value of, the attribute.
376 376
377 377 If 'ignoremissing' is true, a missing 'name' attribute doesn't cause
378 378 an abort, and this function returns None. This is useful to examine
379 379 an attribute which isn't guaranteed to exist in all Mercurial
380 380 versions.
381 381 """
382 382 if not util.safehasattr(obj, name):
383 383 if ignoremissing:
384 384 return None
385 385 raise error.Abort((b"missing attribute %s of %s might break assumption"
386 386 b" of performance measurement") % (name, obj))
387 387
388 388 origvalue = getattr(obj, _sysstr(name))
389 389 class attrutil(object):
390 390 def set(self, newvalue):
391 391 setattr(obj, _sysstr(name), newvalue)
392 392 def restore(self):
393 393 setattr(obj, _sysstr(name), origvalue)
394 394
395 395 return attrutil()
396 396
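# A minimal sketch of the set/restore round-trip provided by
# safeattrsetter(), mirroring its use in gettimer() above:
#
#   uifout = safeattrsetter(ui, b'fout', ignoremissing=True)
#   if uifout:
#       uifout.set(ui.ferr)  # redirect output during the benchmark
#       ...
#       uifout.restore()     # put the original stream back if needed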
397 397 # utilities to examine internal API changes
398 398
399 399 def getbranchmapsubsettable():
400 400 # for "historical portability":
401 401 # subsettable is defined in:
402 402 # - branchmap since 2.9 (or 175c6fd8cacc)
403 403 # - repoview since 2.5 (or 59a9f18d4587)
404 404 for mod in (branchmap, repoview):
405 405 subsettable = getattr(mod, 'subsettable', None)
406 406 if subsettable:
407 407 return subsettable
408 408
409 409 # bisecting in bcee63733aad::59a9f18d4587 can reach here (both
410 410 # branchmap and repoview modules exist, but subsettable attribute
411 411 # doesn't)
412 412 raise error.Abort((b"perfbranchmap not available with this Mercurial"),
413 413 hint=b"use 2.5 or later")
414 414
415 415 def getsvfs(repo):
416 416 """Return appropriate object to access files under .hg/store
417 417 """
418 418 # for "historical portability":
419 419 # repo.svfs has been available since 2.3 (or 7034365089bf)
420 420 svfs = getattr(repo, 'svfs', None)
421 421 if svfs:
422 422 return svfs
423 423 else:
424 424 return getattr(repo, 'sopener')
425 425
426 426 def getvfs(repo):
427 427 """Return appropriate object to access files under .hg
428 428 """
429 429 # for "historical portability":
430 430 # repo.vfs has been available since 2.3 (or 7034365089bf)
431 431 vfs = getattr(repo, 'vfs', None)
432 432 if vfs:
433 433 return vfs
434 434 else:
435 435 return getattr(repo, 'opener')
436 436
437 437 def repocleartagscachefunc(repo):
438 438 """Return the function to clear tags cache according to repo internal API
439 439 """
440 440 if util.safehasattr(repo, b'_tagscache'): # since 2.0 (or 9dca7653b525)
441 441 # in this case, setattr(repo, '_tagscache', None) or so isn't
442 442 # correct way to clear tags cache, because existing code paths
443 443 # expect _tagscache to be a structured object.
444 444 def clearcache():
445 445 # _tagscache has been filteredpropertycache since 2.5 (or
446 446 # 98c867ac1330), and delattr() can't work in such case
447 447 if b'_tagscache' in vars(repo):
448 448 del repo.__dict__[b'_tagscache']
449 449 return clearcache
450 450
451 451 repotags = safeattrsetter(repo, b'_tags', ignoremissing=True)
452 452 if repotags: # since 1.4 (or 5614a628d173)
453 453 return lambda : repotags.set(None)
454 454
455 455 repotagscache = safeattrsetter(repo, b'tagscache', ignoremissing=True)
456 456 if repotagscache: # since 0.6 (or d7df759d0e97)
457 457 return lambda : repotagscache.set(None)
458 458
459 459 # Mercurial earlier than 0.6 (or d7df759d0e97) logically reaches
460 460 # this point, but it isn't so problematic, because:
461 461 # - repo.tags of such Mercurial isn't "callable", and repo.tags()
462 462 # in perftags() causes failure soon
463 463 # - perf.py itself has been available since 1.1 (or eb240755386d)
464 464 raise error.Abort((b"tags API of this hg command is unknown"))
465 465
466 466 # utilities to clear cache
467 467
468 468 def clearfilecache(obj, attrname):
469 469 unfiltered = getattr(obj, 'unfiltered', None)
470 470 if unfiltered is not None:
471 471 obj = obj.unfiltered()
472 472 if attrname in vars(obj):
473 473 delattr(obj, attrname)
474 474 obj._filecache.pop(attrname, None)
475 475
476 476 def clearchangelog(repo):
477 477 if repo is not repo.unfiltered():
478 478 object.__setattr__(repo, r'_clcachekey', None)
479 479 object.__setattr__(repo, r'_clcache', None)
480 480 clearfilecache(repo.unfiltered(), 'changelog')
481 481
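# A minimal sketch, following the shape of perftags/perfbookmarks below,
# of how the cache-clearing helpers above feed a timer setup function so
# that every timed run starts from a cold state:
#
#   def setup():
#       clearchangelog(repo)
#       clearfilecache(repo.unfiltered(), 'manifest')
#   timer(d, setup=setup)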
482 482 # perf commands
483 483
484 484 @command(b'perfwalk', formatteropts)
485 485 def perfwalk(ui, repo, *pats, **opts):
486 486 opts = _byteskwargs(opts)
487 487 timer, fm = gettimer(ui, opts)
488 488 m = scmutil.match(repo[None], pats, {})
489 489 timer(lambda: len(list(repo.dirstate.walk(m, subrepos=[], unknown=True,
490 490 ignored=False))))
491 491 fm.end()
492 492
493 493 @command(b'perfannotate', formatteropts)
494 494 def perfannotate(ui, repo, f, **opts):
495 495 opts = _byteskwargs(opts)
496 496 timer, fm = gettimer(ui, opts)
497 497 fc = repo[b'.'][f]
498 498 timer(lambda: len(fc.annotate(True)))
499 499 fm.end()
500 500
501 501 @command(b'perfstatus',
502 502 [(b'u', b'unknown', False,
503 503 b'ask status to look for unknown files')] + formatteropts)
504 504 def perfstatus(ui, repo, **opts):
505 505 opts = _byteskwargs(opts)
506 506 #m = match.always(repo.root, repo.getcwd())
507 507 #timer(lambda: sum(map(len, repo.dirstate.status(m, [], False, False,
508 508 # False))))
509 509 timer, fm = gettimer(ui, opts)
510 510 timer(lambda: sum(map(len, repo.status(unknown=opts[b'unknown']))))
511 511 fm.end()
512 512
513 513 @command(b'perfaddremove', formatteropts)
514 514 def perfaddremove(ui, repo, **opts):
515 515 opts = _byteskwargs(opts)
516 516 timer, fm = gettimer(ui, opts)
517 517 try:
518 518 oldquiet = repo.ui.quiet
519 519 repo.ui.quiet = True
520 520 matcher = scmutil.match(repo[None])
521 521 opts[b'dry_run'] = True
522 522 timer(lambda: scmutil.addremove(repo, matcher, b"", opts))
523 523 finally:
524 524 repo.ui.quiet = oldquiet
525 525 fm.end()
526 526
527 527 def clearcaches(cl):
528 528 # behave somewhat consistently across internal API changes
529 529 if util.safehasattr(cl, b'clearcaches'):
530 530 cl.clearcaches()
531 531 elif util.safehasattr(cl, b'_nodecache'):
532 532 from mercurial.node import nullid, nullrev
533 533 cl._nodecache = {nullid: nullrev}
534 534 cl._nodepos = None
535 535
536 536 @command(b'perfheads', formatteropts)
537 537 def perfheads(ui, repo, **opts):
538 538 """benchmark the computation of changelog heads"""
539 539 opts = _byteskwargs(opts)
540 540 timer, fm = gettimer(ui, opts)
541 541 cl = repo.changelog
542 542 def s():
543 543 clearcaches(cl)
544 544 def d():
545 545 len(cl.headrevs())
546 546 timer(d, setup=s)
547 547 fm.end()
548 548
549 549 @command(b'perftags', formatteropts+
550 550 [
551 551 (b'', b'clear-revlogs', False, b'refresh changelog and manifest'),
552 552 ])
553 553 def perftags(ui, repo, **opts):
554 554 opts = _byteskwargs(opts)
555 555 timer, fm = gettimer(ui, opts)
556 556 repocleartagscache = repocleartagscachefunc(repo)
557 557 clearrevlogs = opts[b'clear_revlogs']
558 558 def s():
559 559 if clearrevlogs:
560 560 clearchangelog(repo)
561 561 clearfilecache(repo.unfiltered(), 'manifest')
562 562 repocleartagscache()
563 563 def t():
564 564 return len(repo.tags())
565 565 timer(t, setup=s)
566 566 fm.end()
567 567
568 568 @command(b'perfancestors', formatteropts)
569 569 def perfancestors(ui, repo, **opts):
570 570 opts = _byteskwargs(opts)
571 571 timer, fm = gettimer(ui, opts)
572 572 heads = repo.changelog.headrevs()
573 573 def d():
574 574 for a in repo.changelog.ancestors(heads):
575 575 pass
576 576 timer(d)
577 577 fm.end()
578 578
579 579 @command(b'perfancestorset', formatteropts)
580 580 def perfancestorset(ui, repo, revset, **opts):
581 581 opts = _byteskwargs(opts)
582 582 timer, fm = gettimer(ui, opts)
583 583 revs = repo.revs(revset)
584 584 heads = repo.changelog.headrevs()
585 585 def d():
586 586 s = repo.changelog.ancestors(heads)
587 587 for rev in revs:
588 588 rev in s
589 589 timer(d)
590 590 fm.end()
591 591
592 592 @command(b'perfdiscovery', formatteropts, b'PATH')
593 593 def perfdiscovery(ui, repo, path, **opts):
594 594 """benchmark discovery between the local repo and the peer at a given path
595 595 """
596 596 repos = [repo, None]
597 597 timer, fm = gettimer(ui, opts)
598 598 path = ui.expandpath(path)
599 599
600 600 def s():
601 601 repos[1] = hg.peer(ui, opts, path)
602 602 def d():
603 603 setdiscovery.findcommonheads(ui, *repos)
604 604 timer(d, setup=s)
605 605 fm.end()
606 606
607 607 @command(b'perfbookmarks', formatteropts +
608 608 [
609 609 (b'', b'clear-revlogs', False, b'refresh changelog and manifest'),
610 610 ])
611 611 def perfbookmarks(ui, repo, **opts):
612 612 """benchmark parsing bookmarks from disk to memory"""
613 613 opts = _byteskwargs(opts)
614 614 timer, fm = gettimer(ui, opts)
615 615
616 616 clearrevlogs = opts[b'clear_revlogs']
617 617 def s():
618 618 if clearrevlogs:
619 619 clearchangelog(repo)
620 620 clearfilecache(repo, b'_bookmarks')
621 621 def d():
622 622 repo._bookmarks
623 623 timer(d, setup=s)
624 624 fm.end()
625 625
626 626 @command(b'perfbundleread', formatteropts, b'BUNDLE')
627 627 def perfbundleread(ui, repo, bundlepath, **opts):
628 628 """Benchmark reading of bundle files.
629 629
630 630 This command is meant to isolate the I/O part of bundle reading as
631 631 much as possible.
632 632 """
633 633 from mercurial import (
634 634 bundle2,
635 635 exchange,
636 636 streamclone,
637 637 )
638 638
639 639 opts = _byteskwargs(opts)
640 640
641 641 def makebench(fn):
642 642 def run():
643 643 with open(bundlepath, b'rb') as fh:
644 644 bundle = exchange.readbundle(ui, fh, bundlepath)
645 645 fn(bundle)
646 646
647 647 return run
648 648
649 649 def makereadnbytes(size):
650 650 def run():
651 651 with open(bundlepath, b'rb') as fh:
652 652 bundle = exchange.readbundle(ui, fh, bundlepath)
653 653 while bundle.read(size):
654 654 pass
655 655
656 656 return run
657 657
658 658 def makestdioread(size):
659 659 def run():
660 660 with open(bundlepath, b'rb') as fh:
661 661 while fh.read(size):
662 662 pass
663 663
664 664 return run
665 665
666 666 # bundle1
667 667
668 668 def deltaiter(bundle):
669 669 for delta in bundle.deltaiter():
670 670 pass
671 671
672 672 def iterchunks(bundle):
673 673 for chunk in bundle.getchunks():
674 674 pass
675 675
676 676 # bundle2
677 677
678 678 def forwardchunks(bundle):
679 679 for chunk in bundle._forwardchunks():
680 680 pass
681 681
682 682 def iterparts(bundle):
683 683 for part in bundle.iterparts():
684 684 pass
685 685
686 686 def iterpartsseekable(bundle):
687 687 for part in bundle.iterparts(seekable=True):
688 688 pass
689 689
690 690 def seek(bundle):
691 691 for part in bundle.iterparts(seekable=True):
692 692 part.seek(0, os.SEEK_END)
693 693
694 694 def makepartreadnbytes(size):
695 695 def run():
696 696 with open(bundlepath, b'rb') as fh:
697 697 bundle = exchange.readbundle(ui, fh, bundlepath)
698 698 for part in bundle.iterparts():
699 699 while part.read(size):
700 700 pass
701 701
702 702 return run
703 703
704 704 benches = [
705 705 (makestdioread(8192), b'read(8k)'),
706 706 (makestdioread(16384), b'read(16k)'),
707 707 (makestdioread(32768), b'read(32k)'),
708 708 (makestdioread(131072), b'read(128k)'),
709 709 ]
710 710
711 711 with open(bundlepath, b'rb') as fh:
712 712 bundle = exchange.readbundle(ui, fh, bundlepath)
713 713
714 714 if isinstance(bundle, changegroup.cg1unpacker):
715 715 benches.extend([
716 716 (makebench(deltaiter), b'cg1 deltaiter()'),
717 717 (makebench(iterchunks), b'cg1 getchunks()'),
718 718 (makereadnbytes(8192), b'cg1 read(8k)'),
719 719 (makereadnbytes(16384), b'cg1 read(16k)'),
720 720 (makereadnbytes(32768), b'cg1 read(32k)'),
721 721 (makereadnbytes(131072), b'cg1 read(128k)'),
722 722 ])
723 723 elif isinstance(bundle, bundle2.unbundle20):
724 724 benches.extend([
725 725 (makebench(forwardchunks), b'bundle2 forwardchunks()'),
726 726 (makebench(iterparts), b'bundle2 iterparts()'),
727 727 (makebench(iterpartsseekable), b'bundle2 iterparts() seekable'),
728 728 (makebench(seek), b'bundle2 part seek()'),
729 729 (makepartreadnbytes(8192), b'bundle2 part read(8k)'),
730 730 (makepartreadnbytes(16384), b'bundle2 part read(16k)'),
731 731 (makepartreadnbytes(32768), b'bundle2 part read(32k)'),
732 732 (makepartreadnbytes(131072), b'bundle2 part read(128k)'),
733 733 ])
734 734 elif isinstance(bundle, streamclone.streamcloneapplier):
735 735 raise error.Abort(b'stream clone bundles not supported')
736 736 else:
737 737 raise error.Abort(b'unhandled bundle type: %s' % type(bundle))
738 738
739 739 for fn, title in benches:
740 740 timer, fm = gettimer(ui, opts)
741 741 timer(fn, title=title)
742 742 fm.end()
743 743
744 744 @command(b'perfchangegroupchangelog', formatteropts +
745 745 [(b'', b'cgversion', b'02', b'changegroup version'),
746 746 (b'r', b'rev', b'', b'revisions to add to changegroup')])
747 747 def perfchangegroupchangelog(ui, repo, cgversion=b'02', rev=None, **opts):
748 748 """Benchmark producing a changelog group for a changegroup.
749 749
750 750 This measures the time spent processing the changelog during a
751 751 bundle operation. This occurs during `hg bundle` and on a server
752 752 processing a `getbundle` wire protocol request (handles clones
753 753 and pull requests).
754 754
755 755 By default, all revisions are added to the changegroup.
756 756 """
757 757 opts = _byteskwargs(opts)
758 758 cl = repo.changelog
759 759 nodes = [cl.lookup(r) for r in repo.revs(rev or b'all()')]
760 760 bundler = changegroup.getbundler(cgversion, repo)
761 761
762 762 def d():
763 763 state, chunks = bundler._generatechangelog(cl, nodes)
764 764 for chunk in chunks:
765 765 pass
766 766
767 767 timer, fm = gettimer(ui, opts)
768 768
769 769 # Terminal printing can interfere with timing. So disable it.
770 770 with ui.configoverride({(b'progress', b'disable'): True}):
771 771 timer(d)
772 772
773 773 fm.end()
774 774
775 775 @command(b'perfdirs', formatteropts)
776 776 def perfdirs(ui, repo, **opts):
777 777 opts = _byteskwargs(opts)
778 778 timer, fm = gettimer(ui, opts)
779 779 dirstate = repo.dirstate
780 780 b'a' in dirstate
781 781 def d():
782 782 dirstate.hasdir(b'a')
783 783 del dirstate._map._dirs
784 784 timer(d)
785 785 fm.end()
786 786
787 787 @command(b'perfdirstate', formatteropts)
788 788 def perfdirstate(ui, repo, **opts):
789 789 opts = _byteskwargs(opts)
790 790 timer, fm = gettimer(ui, opts)
791 791 b"a" in repo.dirstate
792 792 def d():
793 793 repo.dirstate.invalidate()
794 794 b"a" in repo.dirstate
795 795 timer(d)
796 796 fm.end()
797 797
798 798 @command(b'perfdirstatedirs', formatteropts)
799 799 def perfdirstatedirs(ui, repo, **opts):
800 800 opts = _byteskwargs(opts)
801 801 timer, fm = gettimer(ui, opts)
802 802 b"a" in repo.dirstate
803 803 def d():
804 804 repo.dirstate.hasdir(b"a")
805 805 del repo.dirstate._map._dirs
806 806 timer(d)
807 807 fm.end()
808 808
809 809 @command(b'perfdirstatefoldmap', formatteropts)
810 810 def perfdirstatefoldmap(ui, repo, **opts):
811 811 opts = _byteskwargs(opts)
812 812 timer, fm = gettimer(ui, opts)
813 813 dirstate = repo.dirstate
814 814 b'a' in dirstate
815 815 def d():
816 816 dirstate._map.filefoldmap.get(b'a')
817 817 del dirstate._map.filefoldmap
818 818 timer(d)
819 819 fm.end()
820 820
821 821 @command(b'perfdirfoldmap', formatteropts)
822 822 def perfdirfoldmap(ui, repo, **opts):
823 823 opts = _byteskwargs(opts)
824 824 timer, fm = gettimer(ui, opts)
825 825 dirstate = repo.dirstate
826 826 b'a' in dirstate
827 827 def d():
828 828 dirstate._map.dirfoldmap.get(b'a')
829 829 del dirstate._map.dirfoldmap
830 830 del dirstate._map._dirs
831 831 timer(d)
832 832 fm.end()
833 833
834 834 @command(b'perfdirstatewrite', formatteropts)
835 835 def perfdirstatewrite(ui, repo, **opts):
836 836 opts = _byteskwargs(opts)
837 837 timer, fm = gettimer(ui, opts)
838 838 ds = repo.dirstate
839 839 b"a" in ds
840 840 def d():
841 841 ds._dirty = True
842 842 ds.write(repo.currenttransaction())
843 843 timer(d)
844 844 fm.end()
845 845
846 846 @command(b'perfmergecalculate',
847 847 [(b'r', b'rev', b'.', b'rev to merge against')] + formatteropts)
848 848 def perfmergecalculate(ui, repo, rev, **opts):
849 849 opts = _byteskwargs(opts)
850 850 timer, fm = gettimer(ui, opts)
851 851 wctx = repo[None]
852 852 rctx = scmutil.revsingle(repo, rev, rev)
853 853 ancestor = wctx.ancestor(rctx)
854 854 # we don't want working dir files to be stat'd in the benchmark, so prime
855 855 # that cache
856 856 wctx.dirty()
857 857 def d():
858 858 # acceptremote is True because we don't want prompts in the middle of
859 859 # our benchmark
860 860 merge.calculateupdates(repo, wctx, rctx, [ancestor], False, False,
861 861 acceptremote=True, followcopies=True)
862 862 timer(d)
863 863 fm.end()
864 864
865 865 @command(b'perfpathcopies', [], b"REV REV")
866 866 def perfpathcopies(ui, repo, rev1, rev2, **opts):
867 867 """benchmark the copy tracing logic"""
868 868 opts = _byteskwargs(opts)
869 869 timer, fm = gettimer(ui, opts)
870 870 ctx1 = scmutil.revsingle(repo, rev1, rev1)
871 871 ctx2 = scmutil.revsingle(repo, rev2, rev2)
872 872 def d():
873 873 copies.pathcopies(ctx1, ctx2)
874 874 timer(d)
875 875 fm.end()
876 876
877 877 @command(b'perfphases',
878 878 [(b'', b'full', False, b'include file reading time too'),
879 879 ], b"")
880 880 def perfphases(ui, repo, **opts):
881 881 """benchmark phasesets computation"""
882 882 opts = _byteskwargs(opts)
883 883 timer, fm = gettimer(ui, opts)
884 884 _phases = repo._phasecache
885 885 full = opts.get(b'full')
886 886 def d():
887 887 phases = _phases
888 888 if full:
889 889 clearfilecache(repo, b'_phasecache')
890 890 phases = repo._phasecache
891 891 phases.invalidate()
892 892 phases.loadphaserevs(repo)
893 893 timer(d)
894 894 fm.end()
895 895
896 896 @command(b'perfphasesremote',
897 897 [], b"[DEST]")
898 898 def perfphasesremote(ui, repo, dest=None, **opts):
899 899 """benchmark the time needed to analyse phases of the remote server"""
900 900 from mercurial.node import (
901 901 bin,
902 902 )
903 903 from mercurial import (
904 904 exchange,
905 905 hg,
906 906 phases,
907 907 )
908 908 opts = _byteskwargs(opts)
909 909 timer, fm = gettimer(ui, opts)
910 910
911 911 path = ui.paths.getpath(dest, default=(b'default-push', b'default'))
912 912 if not path:
913 913 raise error.Abort((b'default repository not configured!'),
914 914 hint=(b"see 'hg help config.paths'"))
915 915 dest = path.pushloc or path.loc
916 916 ui.status((b'analysing phase of %s\n') % util.hidepassword(dest))
917 917 other = hg.peer(repo, opts, dest)
918 918
919 919 # easier to perform discovery through the operation
920 920 op = exchange.pushoperation(repo, other)
921 921 exchange._pushdiscoverychangeset(op)
922 922
923 923 remotesubset = op.fallbackheads
924 924
925 925 with other.commandexecutor() as e:
926 926 remotephases = e.callcommand(b'listkeys',
927 927 {b'namespace': b'phases'}).result()
928 928 del other
929 929 publishing = remotephases.get(b'publishing', False)
930 930 if publishing:
931 931 ui.status((b'publishing: yes\n'))
932 932 else:
933 933 ui.status((b'publishing: no\n'))
934 934
935 935 nodemap = repo.changelog.nodemap
936 936 nonpublishroots = 0
937 937 for nhex, phase in remotephases.iteritems():
938 938 if nhex == b'publishing': # ignore data related to publish option
939 939 continue
940 940 node = bin(nhex)
941 941 if node in nodemap and int(phase):
942 942 nonpublishroots += 1
943 943 ui.status((b'number of roots: %d\n') % len(remotephases))
944 944 ui.status((b'number of known non public roots: %d\n') % nonpublishroots)
945 945 def d():
946 946 phases.remotephasessummary(repo,
947 947 remotesubset,
948 948 remotephases)
949 949 timer(d)
950 950 fm.end()
951 951
952 952 @command(b'perfmanifest',[
953 953 (b'm', b'manifest-rev', False, b'Look up a manifest node revision'),
954 954 (b'', b'clear-disk', False, b'clear on-disk caches too'),
955 955 ] + formatteropts, b'REV|NODE')
956 956 def perfmanifest(ui, repo, rev, manifest_rev=False, clear_disk=False, **opts):
957 957 """benchmark the time to read a manifest from disk and return a usable
958 958 dict-like object
959 959
960 960 Manifest caches are cleared before retrieval."""
961 961 opts = _byteskwargs(opts)
962 962 timer, fm = gettimer(ui, opts)
963 963 if not manifest_rev:
964 964 ctx = scmutil.revsingle(repo, rev, rev)
965 965 t = ctx.manifestnode()
966 966 else:
967 967 from mercurial.node import bin
968 968
969 969 if len(rev) == 40:
970 970 t = bin(rev)
971 971 else:
972 972 try:
973 973 rev = int(rev)
974 974
975 975 if util.safehasattr(repo.manifestlog, b'getstorage'):
976 976 t = repo.manifestlog.getstorage(b'').node(rev)
977 977 else:
978 978 t = repo.manifestlog._revlog.lookup(rev)
979 979 except ValueError:
980 980 raise error.Abort(b'manifest revision must be integer or full '
981 981 b'node')
982 982 def d():
983 983 repo.manifestlog.clearcaches(clear_persisted_data=clear_disk)
984 984 repo.manifestlog[t].read()
985 985 timer(d)
986 986 fm.end()
987 987
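# Example invocations of perfmanifest (revision arguments are
# illustrative):
#
#   $ hg perfmanifest tip
#   $ hg perfmanifest --clear-disk tip
#   $ hg perfmanifest -m 0   # treat the argument as a manifest revision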
988 988 @command(b'perfchangeset', formatteropts)
989 989 def perfchangeset(ui, repo, rev, **opts):
990 990 opts = _byteskwargs(opts)
991 991 timer, fm = gettimer(ui, opts)
992 992 n = scmutil.revsingle(repo, rev).node()
993 993 def d():
994 994 repo.changelog.read(n)
995 995 #repo.changelog._cache = None
996 996 timer(d)
997 997 fm.end()
998 998
999 999 @command(b'perfignore', formatteropts)
1000 1000 def perfignore(ui, repo, **opts):
1001 1001 """benchmark operations related to computing ignore"""
1002 1002 opts = _byteskwargs(opts)
1003 1003 timer, fm = gettimer(ui, opts)
1004 1004 dirstate = repo.dirstate
1005 1005
1006 1006 def setupone():
1007 1007 dirstate.invalidate()
1008 1008 clearfilecache(dirstate, b'_ignore')
1009 1009
1010 1010 def runone():
1011 1011 dirstate._ignore
1012 1012
1013 1013 timer(runone, setup=setupone, title=b"load")
1014 1014 fm.end()
1015 1015
1016 1016 @command(b'perfindex', [
1017 1017 (b'', b'rev', [], b'revision to be looked up (default tip)'),
1018 1018 (b'', b'no-lookup', None, b'do not perform a revision lookup after creation'),
1019 1019 ] + formatteropts)
1020 1020 def perfindex(ui, repo, **opts):
1021 1021 """benchmark index creation time followed by a lookup
1022 1022
1023 1023 The default is to look `tip` up. Depending on the index implementation,
1024 1024 the revision looked up can matter. For example, an implementation
1025 1025 scanning the index will have a faster lookup time for `--rev tip` than for
1026 1026 `--rev 0`. The number of looked up revisions and their order can also
1027 1027 matter.
1028 1028
1029 1029 Examples of useful sets to test:
1030 1030 * tip
1031 1031 * 0
1032 1032 * -10:
1033 1033 * :10
1034 1034 * -10: + :10
1035 1035 * :10: + -10:
1036 1036 * -10000:
1037 1037 * -10000: + 0
1038 1038
1039 1039 It is not currently possible to check for lookup of a missing node. For
1040 1040 deeper lookup benchmarking, check out the `perfnodemap` command."""
1041 1041 import mercurial.revlog
1042 1042 opts = _byteskwargs(opts)
1043 1043 timer, fm = gettimer(ui, opts)
1044 1044 mercurial.revlog._prereadsize = 2**24 # disable lazy parser in old hg
1045 1045 if opts[b'no_lookup']:
1046 1046 if opts[b'rev']:
1047 1047 raise error.Abort(b'--no-lookup and --rev are mutually exclusive')
1048 1048 nodes = []
1049 1049 elif not opts[b'rev']:
1050 1050 nodes = [repo[b"tip"].node()]
1051 1051 else:
1052 1052 revs = scmutil.revrange(repo, opts[b'rev'])
1053 1053 cl = repo.changelog
1054 1054 nodes = [cl.node(r) for r in revs]
1055 1055
1056 1056 unfi = repo.unfiltered()
1057 1057 # find the filecache func directly
1058 1058 # This avoids polluting the benchmark with the filecache logic
1059 1059 makecl = unfi.__class__.changelog.func
1060 1060 def setup():
1061 1061 # probably not necessary, but for good measure
1062 1062 clearchangelog(unfi)
1063 1063 def d():
1064 1064 cl = makecl(unfi)
1065 1065 for n in nodes:
1066 1066 cl.rev(n)
1067 1067 timer(d, setup=setup)
1068 1068 fm.end()
1069 1069
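# Example invocations covering some of the revision sets suggested in
# the perfindex docstring above:
#
#   $ hg perfindex --rev tip
#   $ hg perfindex --rev '-10000:' --rev 0
#   $ hg perfindex --no-lookup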
1070 1070 @command(b'perfnodemap', [
1071 1071 (b'', b'rev', [], b'revision to be looked up (default tip)'),
1072 1072 (b'', b'clear-caches', True, b'clear revlog cache between calls'),
1073 1073 ] + formatteropts)
1074 1074 def perfnodemap(ui, repo, **opts):
1075 1075 """benchmark the time necessary to look up revisions from a cold nodemap
1076 1076
1077 1077 Depending on the implementation, the amount and order of revisions we
1078 1078 look up can vary. Examples of useful sets to test:
1079 1079 * tip
1080 1080 * 0
1081 1081 * -10:
1082 1082 * :10
1083 1083 * -10: + :10
1084 1084 * :10: + -10:
1085 1085 * -10000:
1086 1086 * -10000: + 0
1087 1087
1088 1088 The command currently focuses on valid binary lookup. Benchmarking
1089 1089 hex lookup, prefix lookup and missing lookup would also be valuable.
1090 1090 """
1091 1091 import mercurial.revlog
1092 1092 opts = _byteskwargs(opts)
1093 1093 timer, fm = gettimer(ui, opts)
1094 1094 mercurial.revlog._prereadsize = 2**24 # disable lazy parser in old hg
1095 1095
1096 1096 unfi = repo.unfiltered()
1097 1097 clearcaches = opts[b'clear_caches']
1098 1098 # find the filecache func directly
1099 1099 # This avoids polluting the benchmark with the filecache logic
1100 1100 makecl = unfi.__class__.changelog.func
1101 1101 if not opts[b'rev']:
1102 1102 raise error.Abort(b'use --rev to specify revisions to look up')
1103 1103 revs = scmutil.revrange(repo, opts[b'rev'])
1104 1104 cl = repo.changelog
1105 1105 nodes = [cl.node(r) for r in revs]
1106 1106
1107 1107 # use a list to pass reference to a nodemap from one closure to the next
1108 1108 nodeget = [None]
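# (The single-element 'nodeget' list is a py2-compatible stand-in for
# 'nonlocal': setnodeget() rebinds nodeget[0] and d() reads it, letting
# the setup closure hand a freshly built nodemap.get to the timed
# closure.)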
1109 1109 def setnodeget():
1110 1110 # probably not necessary, but for good measure
1111 1111 clearchangelog(unfi)
1112 1112 nodeget[0] = makecl(unfi).nodemap.get
1113 1113
1114 1114 def d():
1115 1115 get = nodeget[0]
1116 1116 for n in nodes:
1117 1117 get(n)
1118 1118
1119 1119 setup = None
1120 1120 if clearcaches:
1121 1121 def setup():
1122 1122 setnodeget()
1123 1123 else:
1124 1124 setnodeget()
1125 1125 d() # prewarm the data structure
1126 1126 timer(d, setup=setup)
1127 1127 fm.end()
1128 1128
1129 1129 @command(b'perfstartup', formatteropts)
1130 1130 def perfstartup(ui, repo, **opts):
1131 1131 opts = _byteskwargs(opts)
1132 1132 timer, fm = gettimer(ui, opts)
1133 1133 def d():
1134 1134 if os.name != r'nt':
1135 1135 os.system(b"HGRCPATH= %s version -q > /dev/null" %
1136 1136 fsencode(sys.argv[0]))
1137 1137 else:
1138 1138 os.environ[r'HGRCPATH'] = r' '
1139 1139 os.system(r"%s version -q > NUL" % sys.argv[0])
1140 1140 timer(d)
1141 1141 fm.end()
1142 1142
1143 1143 @command(b'perfparents', formatteropts)
1144 1144 def perfparents(ui, repo, **opts):
1145 1145 opts = _byteskwargs(opts)
1146 1146 timer, fm = gettimer(ui, opts)
1147 1147 # control the number of commits perfparents iterates over
1148 1148 # experimental config: perf.parentscount
1149 1149 count = getint(ui, b"perf", b"parentscount", 1000)
1150 1150 if len(repo.changelog) < count:
1151 1151 raise error.Abort(b"repo needs %d commits for this test" % count)
1152 1152 repo = repo.unfiltered()
1153 1153 nl = [repo.changelog.node(i) for i in _xrange(count)]
1154 1154 def d():
1155 1155 for n in nl:
1156 1156 repo.changelog.parents(n)
1157 1157 timer(d)
1158 1158 fm.end()
1159 1159
1160 1160 @command(b'perfctxfiles', formatteropts)
1161 1161 def perfctxfiles(ui, repo, x, **opts):
1162 1162 opts = _byteskwargs(opts)
1163 1163 x = int(x)
1164 1164 timer, fm = gettimer(ui, opts)
1165 1165 def d():
1166 1166 len(repo[x].files())
1167 1167 timer(d)
1168 1168 fm.end()
1169 1169
1170 1170 @command(b'perfrawfiles', formatteropts)
1171 1171 def perfrawfiles(ui, repo, x, **opts):
1172 1172 opts = _byteskwargs(opts)
1173 1173 x = int(x)
1174 1174 timer, fm = gettimer(ui, opts)
1175 1175 cl = repo.changelog
1176 1176 def d():
1177 1177 len(cl.read(x)[3])
1178 1178 timer(d)
1179 1179 fm.end()
1180 1180
1181 1181 @command(b'perflookup', formatteropts)
1182 1182 def perflookup(ui, repo, rev, **opts):
1183 1183 opts = _byteskwargs(opts)
1184 1184 timer, fm = gettimer(ui, opts)
1185 1185 timer(lambda: len(repo.lookup(rev)))
1186 1186 fm.end()
1187 1187
1188 1188 @command(b'perflinelogedits',
1189 1189 [(b'n', b'edits', 10000, b'number of edits'),
1190 1190 (b'', b'max-hunk-lines', 10, b'max lines in a hunk'),
1191 1191 ], norepo=True)
1192 1192 def perflinelogedits(ui, **opts):
1193 1193 from mercurial import linelog
1194 1194
1195 1195 opts = _byteskwargs(opts)
1196 1196
1197 1197 edits = opts[b'edits']
1198 1198 maxhunklines = opts[b'max_hunk_lines']
1199 1199
1200 1200 maxb1 = 100000
1201 1201 random.seed(0)
1202 1202 randint = random.randint
1203 1203 currentlines = 0
1204 1204 arglist = []
1205 1205 for rev in _xrange(edits):
1206 1206 a1 = randint(0, currentlines)
1207 1207 a2 = randint(a1, min(currentlines, a1 + maxhunklines))
1208 1208 b1 = randint(0, maxb1)
1209 1209 b2 = randint(b1, b1 + maxhunklines)
1210 1210 currentlines += (b2 - b1) - (a2 - a1)
1211 1211 arglist.append((rev, a1, a2, b1, b2))
1212 1212
1213 1213 def d():
1214 1214 ll = linelog.linelog()
1215 1215 for args in arglist:
1216 1216 ll.replacelines(*args)
1217 1217
1218 1218 timer, fm = gettimer(ui, opts)
1219 1219 timer(d)
1220 1220 fm.end()
1221 1221
1222 1222 @command(b'perfrevrange', formatteropts)
1223 1223 def perfrevrange(ui, repo, *specs, **opts):
1224 1224 opts = _byteskwargs(opts)
1225 1225 timer, fm = gettimer(ui, opts)
1226 1226 revrange = scmutil.revrange
1227 1227 timer(lambda: len(revrange(repo, specs)))
1228 1228 fm.end()
1229 1229
1230 1230 @command(b'perfnodelookup', formatteropts)
1231 1231 def perfnodelookup(ui, repo, rev, **opts):
1232 1232 opts = _byteskwargs(opts)
1233 1233 timer, fm = gettimer(ui, opts)
1234 1234 import mercurial.revlog
1235 1235 mercurial.revlog._prereadsize = 2**24 # disable lazy parser in old hg
1236 1236 n = scmutil.revsingle(repo, rev).node()
1237 1237 cl = mercurial.revlog.revlog(getsvfs(repo), b"00changelog.i")
1238 1238 def d():
1239 1239 cl.rev(n)
1240 1240 clearcaches(cl)
1241 1241 timer(d)
1242 1242 fm.end()
1243 1243
1244 1244 @command(b'perflog',
1245 1245 [(b'', b'rename', False, b'ask log to follow renames')
1246 1246 ] + formatteropts)
1247 1247 def perflog(ui, repo, rev=None, **opts):
1248 1248 opts = _byteskwargs(opts)
1249 1249 if rev is None:
1250 1250 rev = []
1251 1251 timer, fm = gettimer(ui, opts)
1252 1252 ui.pushbuffer()
1253 1253 timer(lambda: commands.log(ui, repo, rev=rev, date=b'', user=b'',
1254 1254 copies=opts.get(b'rename')))
1255 1255 ui.popbuffer()
1256 1256 fm.end()
1257 1257
1258 1258 @command(b'perfmoonwalk', formatteropts)
1259 1259 def perfmoonwalk(ui, repo, **opts):
1260 1260 """benchmark walking the changelog backwards
1261 1261
1262 1262 This also loads the changelog data for each revision in the changelog.
1263 1263 """
1264 1264 opts = _byteskwargs(opts)
1265 1265 timer, fm = gettimer(ui, opts)
1266 1266 def moonwalk():
1267 1267 for i in repo.changelog.revs(start=(len(repo) - 1), stop=-1):
1268 1268 ctx = repo[i]
1269 1269 ctx.branch() # read changelog data (in addition to the index)
1270 1270 timer(moonwalk)
1271 1271 fm.end()
1272 1272
1273 1273 @command(b'perftemplating',
1274 1274 [(b'r', b'rev', [], b'revisions to run the template on'),
1275 1275 ] + formatteropts)
1276 1276 def perftemplating(ui, repo, testedtemplate=None, **opts):
1277 1277 """test the rendering time of a given template"""
1278 1278 if makelogtemplater is None:
1279 1279 raise error.Abort((b"perftemplating not available with this Mercurial"),
1280 1280 hint=b"use 4.3 or later")
1281 1281
1282 1282 opts = _byteskwargs(opts)
1283 1283
1284 1284 nullui = ui.copy()
1285 1285 nullui.fout = open(os.devnull, r'wb')
1286 1286 nullui.disablepager()
1287 1287 revs = opts.get(b'rev')
1288 1288 if not revs:
1289 1289 revs = [b'all()']
1290 1290 revs = list(scmutil.revrange(repo, revs))
1291 1291
1292 1292 defaulttemplate = (b'{date|shortdate} [{rev}:{node|short}]'
1293 1293 b' {author|person}: {desc|firstline}\n')
1294 1294 if testedtemplate is None:
1295 1295 testedtemplate = defaulttemplate
1296 1296 displayer = makelogtemplater(nullui, repo, testedtemplate)
1297 1297 def format():
1298 1298 for r in revs:
1299 1299 ctx = repo[r]
1300 1300 displayer.show(ctx)
1301 1301 displayer.flush(ctx)
1302 1302
1303 1303 timer, fm = gettimer(ui, opts)
1304 1304 timer(format)
1305 1305 fm.end()
1306 1306
1307 1307 @command(b'perfhelper-pathcopies', formatteropts +
1308 1308 [
1309 1309 (b'r', b'revs', [], b'restrict search to these revisions'),
1310 1310 (b'', b'timing', False, b'provides extra data (costly)'),
1311 1311 ])
1312 1312 def perfhelperpathcopies(ui, repo, revs=[], **opts):
1313 1313 """find statistics about potential parameters for `perfpathcopies`
1314 1314
1315 1315 This command finds source-destination pairs relevant for copy-tracing
1316 1316 testing. It reports values for some parameters that impact copy tracing time.
1317 1317
1318 1318 If `--timing` is set, rename detection is run and the associated timing
1319 1319 will be reported. The extra details come at the cost of a slower command
1320 1320 execution.
1321 1321
1322 1322 Since the rename detection is only run once, other factors might easily
1323 1323 affect the precision of the timing. However, it should give a good
1324 1324 approximation of which revision pairs are very costly.
1325 1325 """
1326 1326 opts = _byteskwargs(opts)
1327 1327 fm = ui.formatter(b'perf', opts)
1328 1328 dotiming = opts[b'timing']
1329 1329
1330 1330 if dotiming:
1331 1331 header = '%12s %12s %12s %12s %12s %12s\n'
1332 1332 output = ("%(source)12s %(destination)12s "
1333 1333 "%(nbrevs)12d %(nbmissingfiles)12d "
1334 1334 "%(nbrenamedfiles)12d %(time)18.5f\n")
1335 1335 header_names = ("source", "destination", "nb-revs", "nb-files",
1336 1336 "nb-renames", "time")
1337 1337 fm.plain(header % header_names)
1338 1338 else:
1339 1339 header = '%12s %12s %12s %12s\n'
1340 1340 output = ("%(source)12s %(destination)12s "
1341 1341 "%(nbrevs)12d %(nbmissingfiles)12d\n")
1342 1342 fm.plain(header % ("source", "destination", "nb-revs", "nb-files"))
1343 1343
1344 1344 if not revs:
1345 1345 revs = ['all()']
1346 1346 revs = scmutil.revrange(repo, revs)
1347 1347
1348 1348 roi = repo.revs('merge() and %ld', revs)
1349 1349 for r in roi:
1350 1350 ctx = repo[r]
1351 1351 p1 = ctx.p1().rev()
1352 1352 p2 = ctx.p2().rev()
1353 1353 bases = repo.changelog._commonancestorsheads(p1, p2)
1354 1354 for p in (p1, p2):
1355 1355 for b in bases:
1356 1356 base = repo[b]
1357 1357 parent = repo[p]
1358 1358 missing = copies._computeforwardmissing(base, parent)
1359 1359 if not missing:
1360 1360 continue
1361 1361 data = {
1362 1362 b'source': base.hex(),
1363 1363 b'destination': parent.hex(),
1364 1364 b'nbrevs': len(repo.revs('%d::%d', b, p)),
1365 1365 b'nbmissingfiles': len(missing),
1366 1366 }
1367 1367 if dotiming:
1368 1368 begin = util.timer()
1369 1369 renames = copies.pathcopies(base, parent)
1370 1370 end = util.timer()
1371 1371 # not very stable timing since we did only one run
1372 1372 data['time'] = end - begin
1373 1373 data['nbrenamedfiles'] = len(renames)
1374 1374 fm.startitem()
1375 1375 fm.data(**data)
1376 1376 out = data.copy()
1377 1377 out['source'] = fm.hexfunc(base.node())
1378 1378 out['destination'] = fm.hexfunc(parent.node())
1379 1379 fm.plain(output % out)
1380 1380
1381 1381 fm.end()
1382 1382
1383 1383 @command(b'perfcca', formatteropts)
1384 1384 def perfcca(ui, repo, **opts):
1385 1385 opts = _byteskwargs(opts)
1386 1386 timer, fm = gettimer(ui, opts)
1387 1387 timer(lambda: scmutil.casecollisionauditor(ui, False, repo.dirstate))
1388 1388 fm.end()
1389 1389
1390 1390 @command(b'perffncacheload', formatteropts)
1391 1391 def perffncacheload(ui, repo, **opts):
1392 1392 opts = _byteskwargs(opts)
1393 1393 timer, fm = gettimer(ui, opts)
1394 1394 s = repo.store
1395 1395 def d():
1396 1396 s.fncache._load()
1397 1397 timer(d)
1398 1398 fm.end()
1399 1399
1400 1400 @command(b'perffncachewrite', formatteropts)
1401 1401 def perffncachewrite(ui, repo, **opts):
1402 1402 opts = _byteskwargs(opts)
1403 1403 timer, fm = gettimer(ui, opts)
1404 1404 s = repo.store
1405 1405 lock = repo.lock()
1406 1406 s.fncache._load()
1407 1407 tr = repo.transaction(b'perffncachewrite')
1408 1408 tr.addbackup(b'fncache')
1409 1409 def d():
1410 1410 s.fncache._dirty = True
1411 1411 s.fncache.write(tr)
1412 1412 timer(d)
1413 1413 tr.close()
1414 1414 lock.release()
1415 1415 fm.end()
1416 1416
1417 1417 @command(b'perffncacheencode', formatteropts)
1418 1418 def perffncacheencode(ui, repo, **opts):
1419 1419 opts = _byteskwargs(opts)
1420 1420 timer, fm = gettimer(ui, opts)
1421 1421 s = repo.store
1422 1422 s.fncache._load()
1423 1423 def d():
1424 1424 for p in s.fncache.entries:
1425 1425 s.encode(p)
1426 1426 timer(d)
1427 1427 fm.end()
1428 1428
1429 1429 def _bdiffworker(q, blocks, xdiff, ready, done):
1430 1430 while not done.is_set():
1431 1431 pair = q.get()
1432 1432 while pair is not None:
1433 1433 if xdiff:
1434 1434 mdiff.bdiff.xdiffblocks(*pair)
1435 1435 elif blocks:
1436 1436 mdiff.bdiff.blocks(*pair)
1437 1437 else:
1438 1438 mdiff.textdiff(*pair)
1439 1439 q.task_done()
1440 1440 pair = q.get()
1441 1441 q.task_done() # for the None one
1442 1442 with ready:
1443 1443 ready.wait()
1444 1444
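# Protocol between perfbdiff and _bdiffworker (restating the code above):
# each worker blocks in q.get(); a None sentinel marks the end of a
# batch, after which the worker waits on the 'ready' condition until the
# main thread either queues another batch or sets 'done' to shut the
# pool down.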
1445 1445 def _manifestrevision(repo, mnode):
1446 1446 ml = repo.manifestlog
1447 1447
1448 1448 if util.safehasattr(ml, b'getstorage'):
1449 1449 store = ml.getstorage(b'')
1450 1450 else:
1451 1451 store = ml._revlog
1452 1452
1453 1453 return store.revision(mnode)
1454 1454
1455 1455 @command(b'perfbdiff', revlogopts + formatteropts + [
1456 1456 (b'', b'count', 1, b'number of revisions to test (when using --startrev)'),
1457 1457 (b'', b'alldata', False, b'test bdiffs for all associated revisions'),
1458 1458 (b'', b'threads', 0, b'number of thread to use (disable with 0)'),
1459 1459 (b'', b'blocks', False, b'test computing diffs into blocks'),
1460 1460 (b'', b'xdiff', False, b'use xdiff algorithm'),
1461 1461 ],
1462 1462
1463 1463 b'-c|-m|FILE REV')
1464 1464 def perfbdiff(ui, repo, file_, rev=None, count=None, threads=0, **opts):
1465 1465 """benchmark a bdiff between revisions
1466 1466
1467 1467 By default, benchmark a bdiff between a revision and its delta parent.
1468 1468
1469 1469 With ``--count``, benchmark bdiffs between delta parents and self for N
1470 1470 revisions starting at the specified revision.
1471 1471
1472 1472 With ``--alldata``, assume the requested revision is a changeset and
1473 1473 measure bdiffs for all changes related to that changeset (manifest
1474 1474 and filelogs).
1475 1475 """
1476 1476 opts = _byteskwargs(opts)
1477 1477
1478 1478 if opts[b'xdiff'] and not opts[b'blocks']:
1479 1479 raise error.CommandError(b'perfbdiff', b'--xdiff requires --blocks')
1480 1480
1481 1481 if opts[b'alldata']:
1482 1482 opts[b'changelog'] = True
1483 1483
1484 1484 if opts.get(b'changelog') or opts.get(b'manifest'):
1485 1485 file_, rev = None, file_
1486 1486 elif rev is None:
1487 1487 raise error.CommandError(b'perfbdiff', b'invalid arguments')
1488 1488
1489 1489 blocks = opts[b'blocks']
1490 1490 xdiff = opts[b'xdiff']
1491 1491 textpairs = []
1492 1492
1493 1493 r = cmdutil.openrevlog(repo, b'perfbdiff', file_, opts)
1494 1494
1495 1495 startrev = r.rev(r.lookup(rev))
1496 1496 for rev in range(startrev, min(startrev + count, len(r) - 1)):
1497 1497 if opts[b'alldata']:
1498 1498 # Load revisions associated with changeset.
1499 1499 ctx = repo[rev]
1500 1500 mtext = _manifestrevision(repo, ctx.manifestnode())
1501 1501 for pctx in ctx.parents():
1502 1502 pman = _manifestrevision(repo, pctx.manifestnode())
1503 1503 textpairs.append((pman, mtext))
1504 1504
1505 1505 # Load filelog revisions by iterating manifest delta.
1506 1506 man = ctx.manifest()
1507 1507 pman = ctx.p1().manifest()
1508 1508 for filename, change in pman.diff(man).items():
1509 1509 fctx = repo.file(filename)
1510 1510 f1 = fctx.revision(change[0][0] or -1)
1511 1511 f2 = fctx.revision(change[1][0] or -1)
1512 1512 textpairs.append((f1, f2))
1513 1513 else:
1514 1514 dp = r.deltaparent(rev)
1515 1515 textpairs.append((r.revision(dp), r.revision(rev)))
1516 1516
1517 1517 withthreads = threads > 0
1518 1518 if not withthreads:
1519 1519 def d():
1520 1520 for pair in textpairs:
1521 1521 if xdiff:
1522 1522 mdiff.bdiff.xdiffblocks(*pair)
1523 1523 elif blocks:
1524 1524 mdiff.bdiff.blocks(*pair)
1525 1525 else:
1526 1526 mdiff.textdiff(*pair)
1527 1527 else:
1528 1528 q = queue()
1529 1529 for i in _xrange(threads):
1530 1530 q.put(None)
1531 1531 ready = threading.Condition()
1532 1532 done = threading.Event()
1533 1533 for i in _xrange(threads):
1534 1534 threading.Thread(target=_bdiffworker,
1535 1535 args=(q, blocks, xdiff, ready, done)).start()
1536 1536 q.join()
1537 1537 def d():
1538 1538 for pair in textpairs:
1539 1539 q.put(pair)
1540 1540 for i in _xrange(threads):
1541 1541 q.put(None)
1542 1542 with ready:
1543 1543 ready.notify_all()
1544 1544 q.join()
1545 1545 timer, fm = gettimer(ui, opts)
1546 1546 timer(d)
1547 1547 fm.end()
1548 1548
1549 1549 if withthreads:
1550 1550 done.set()
1551 1551 for i in _xrange(threads):
1552 1552 q.put(None)
1553 1553 with ready:
1554 1554 ready.notify_all()
1555 1555
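# Example invocations of perfbdiff (file and revision arguments are
# illustrative):
#
#   $ hg perfbdiff --count 10 mercurial/commands.py 1000
#   $ hg perfbdiff --alldata 1000
#   $ hg perfbdiff --blocks --xdiff -m 1000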
1556 1556 @command(b'perfunidiff', revlogopts + formatteropts + [
1557 1557 (b'', b'count', 1, b'number of revisions to test (when using --startrev)'),
1558 1558 (b'', b'alldata', False, b'test unidiffs for all associated revisions'),
1559 1559 ], b'-c|-m|FILE REV')
1560 1560 def perfunidiff(ui, repo, file_, rev=None, count=None, **opts):
1561 1561 """benchmark a unified diff between revisions
1562 1562
1563 1563 This doesn't include any copy tracing - it's just a unified diff
1564 1564 of the texts.
1565 1565
1566 1566 By default, benchmark a diff between a revision and its delta parent.
1567 1567
1568 1568 With ``--count``, benchmark diffs between delta parents and self for N
1569 1569 revisions starting at the specified revision.
1570 1570
1571 1571 With ``--alldata``, assume the requested revision is a changeset and
1572 1572 measure diffs for all changes related to that changeset (manifest
1573 1573 and filelogs).
1574 1574 """
1575 1575 opts = _byteskwargs(opts)
1576 1576 if opts[b'alldata']:
1577 1577 opts[b'changelog'] = True
1578 1578
1579 1579 if opts.get(b'changelog') or opts.get(b'manifest'):
1580 1580 file_, rev = None, file_
1581 1581 elif rev is None:
1582 1582 raise error.CommandError(b'perfunidiff', b'invalid arguments')
1583 1583
1584 1584 textpairs = []
1585 1585
1586 1586 r = cmdutil.openrevlog(repo, b'perfunidiff', file_, opts)
1587 1587
1588 1588 startrev = r.rev(r.lookup(rev))
1589 1589 for rev in range(startrev, min(startrev + count, len(r) - 1)):
1590 1590 if opts[b'alldata']:
1591 1591 # Load revisions associated with changeset.
1592 1592 ctx = repo[rev]
1593 1593 mtext = _manifestrevision(repo, ctx.manifestnode())
1594 1594 for pctx in ctx.parents():
1595 1595 pman = _manifestrevision(repo, pctx.manifestnode())
1596 1596 textpairs.append((pman, mtext))
1597 1597
1598 1598 # Load filelog revisions by iterating manifest delta.
1599 1599 man = ctx.manifest()
1600 1600 pman = ctx.p1().manifest()
1601 1601 for filename, change in pman.diff(man).items():
1602 1602 fctx = repo.file(filename)
1603 1603 f1 = fctx.revision(change[0][0] or -1)
1604 1604 f2 = fctx.revision(change[1][0] or -1)
1605 1605 textpairs.append((f1, f2))
1606 1606 else:
1607 1607 dp = r.deltaparent(rev)
1608 1608 textpairs.append((r.revision(dp), r.revision(rev)))
1609 1609
1610 1610 def d():
1611 1611 for left, right in textpairs:
1612 1612 # The date strings don't matter, so we pass empty strings.
1613 1613 headerlines, hunks = mdiff.unidiff(
1614 1614 left, b'', right, b'', b'left', b'right', binary=False)
1615 1615 # consume iterators in roughly the way patch.py does
1616 1616 b'\n'.join(headerlines)
1617 1617 b''.join(sum((list(hlines) for hrange, hlines in hunks), []))
1618 1618 timer, fm = gettimer(ui, opts)
1619 1619 timer(d)
1620 1620 fm.end()
1621 1621
1622 1622 @command(b'perfdiffwd', formatteropts)
1623 1623 def perfdiffwd(ui, repo, **opts):
1624 1624 """Profile diff of working directory changes"""
1625 1625 opts = _byteskwargs(opts)
1626 1626 timer, fm = gettimer(ui, opts)
1627 1627 options = {
1628 1628 'w': 'ignore_all_space',
1629 1629 'b': 'ignore_space_change',
1630 1630 'B': 'ignore_blank_lines',
1631 1631 }
1632 1632
1633 1633 for diffopt in ('', 'w', 'b', 'B', 'wB'):
1634 1634 opts = dict((options[c], b'1') for c in diffopt)
1635 1635 def d():
1636 1636 ui.pushbuffer()
1637 1637 commands.diff(ui, repo, **opts)
1638 1638 ui.popbuffer()
1639 1639 diffopt = diffopt.encode('ascii')
1640 1640 title = b'diffopts: %s' % (diffopt and (b'-' + diffopt) or b'none')
1641 1641 timer(d, title=title)
1642 1642 fm.end()
1643 1643
1644 1644 @command(b'perfrevlogindex', revlogopts + formatteropts,
1645 1645 b'-c|-m|FILE')
1646 1646 def perfrevlogindex(ui, repo, file_=None, **opts):
1647 1647 """Benchmark operations against a revlog index.
1648 1648
1649 1649 This tests constructing a revlog instance, reading index data,
1650 1650 parsing index data, and performing various operations related to
1651 1651 index data.
1652 1652 """
1653 1653
1654 1654 opts = _byteskwargs(opts)
1655 1655
1656 1656 rl = cmdutil.openrevlog(repo, b'perfrevlogindex', file_, opts)
1657 1657
1658 1658 opener = getattr(rl, 'opener') # trick linter
1659 1659 indexfile = rl.indexfile
1660 1660 data = opener.read(indexfile)
1661 1661
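# A revlog starts with a 4-byte big-endian header: the low 16 bits hold
# the format version, the higher bits hold flags such as inline data.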
1662 1662 header = struct.unpack(b'>I', data[0:4])[0]
1663 1663 version = header & 0xFFFF
1664 1664 if version == 1:
1665 1665 revlogio = revlog.revlogio()
1666 1666 inline = header & (1 << 16)
1667 1667 else:
1668 1668 raise error.Abort(b'unsupported revlog version: %d' % version)
1669 1669
1670 1670 rllen = len(rl)
1671 1671
1672 1672 node0 = rl.node(0)
1673 1673 node25 = rl.node(rllen // 4)
1674 1674 node50 = rl.node(rllen // 2)
1675 1675 node75 = rl.node(rllen // 4 * 3)
1676 1676 node100 = rl.node(rllen - 1)
1677 1677
1678 1678 allrevs = range(rllen)
1679 1679 allrevsrev = list(reversed(allrevs))
1680 1680 allnodes = [rl.node(rev) for rev in range(rllen)]
1681 1681 allnodesrev = list(reversed(allnodes))
1682 1682
1683 1683 def constructor():
1684 1684 revlog.revlog(opener, indexfile)
1685 1685
1686 1686 def read():
1687 1687 with opener(indexfile) as fh:
1688 1688 fh.read()
1689 1689
1690 1690 def parseindex():
1691 1691 revlogio.parseindex(data, inline)
1692 1692
1693 1693 def getentry(revornode):
1694 1694 index = revlogio.parseindex(data, inline)[0]
1695 1695 index[revornode]
1696 1696
1697 1697 def getentries(revs, count=1):
1698 1698 index = revlogio.parseindex(data, inline)[0]
1699 1699
1700 1700 for i in range(count):
1701 1701 for rev in revs:
1702 1702 index[rev]
1703 1703
1704 1704 def resolvenode(node):
1705 1705 nodemap = revlogio.parseindex(data, inline)[1]
1706 1706 # This only works for the C code.
1707 1707 if nodemap is None:
1708 1708 return
1709 1709
1710 1710 try:
1711 1711 nodemap[node]
1712 1712 except error.RevlogError:
1713 1713 pass
1714 1714
1715 1715 def resolvenodes(nodes, count=1):
1716 1716 nodemap = revlogio.parseindex(data, inline)[1]
1717 1717 if nodemap is None:
1718 1718 return
1719 1719
1720 1720 for i in range(count):
1721 1721 for node in nodes:
1722 1722 try:
1723 1723 nodemap[node]
1724 1724 except error.RevlogError:
1725 1725 pass
1726 1726
1727 1727 benches = [
1728 1728 (constructor, b'revlog constructor'),
1729 1729 (read, b'read'),
1730 1730 (parseindex, b'create index object'),
1731 1731 (lambda: getentry(0), b'retrieve index entry for rev 0'),
1732 1732 (lambda: resolvenode(b'a' * 20), b'look up missing node'),
1733 1733 (lambda: resolvenode(node0), b'look up node at rev 0'),
1734 1734 (lambda: resolvenode(node25), b'look up node at 1/4 len'),
1735 1735 (lambda: resolvenode(node50), b'look up node at 1/2 len'),
1736 1736 (lambda: resolvenode(node75), b'look up node at 3/4 len'),
1737 1737 (lambda: resolvenode(node100), b'look up node at tip'),
1738 1738 # 2x variation is to measure caching impact.
1739 1739 (lambda: resolvenodes(allnodes),
1740 1740 b'look up all nodes (forward)'),
1741 1741 (lambda: resolvenodes(allnodes, 2),
1742 1742 b'look up all nodes 2x (forward)'),
1743 1743 (lambda: resolvenodes(allnodesrev),
1744 1744 b'look up all nodes (reverse)'),
1745 1745 (lambda: resolvenodes(allnodesrev, 2),
1746 1746 b'look up all nodes 2x (reverse)'),
1747 1747 (lambda: getentries(allrevs),
1748 1748 b'retrieve all index entries (forward)'),
1749 1749 (lambda: getentries(allrevs, 2),
1750 1750 b'retrieve all index entries 2x (forward)'),
1751 1751 (lambda: getentries(allrevsrev),
1752 1752 b'retrieve all index entries (reverse)'),
1753 1753 (lambda: getentries(allrevsrev, 2),
1754 1754 b'retrieve all index entries 2x (reverse)'),
1755 1755 ]
1756 1756
1757 1757 for fn, title in benches:
1758 1758 timer, fm = gettimer(ui, opts)
1759 1759 timer(fn, title=title)
1760 1760 fm.end()
1761 1761
1762 1762 @command(b'perfrevlogrevisions', revlogopts + formatteropts +
1763 1763 [(b'd', b'dist', 100, b'distance between the revisions'),
1764 1764 (b's', b'startrev', 0, b'revision to start reading at'),
1765 1765 (b'', b'reverse', False, b'read in reverse')],
1766 1766 b'-c|-m|FILE')
1767 1767 def perfrevlogrevisions(ui, repo, file_=None, startrev=0, reverse=False,
1768 1768 **opts):
1769 1769 """Benchmark reading a series of revisions from a revlog.
1770 1770
1771 1771 By default, we read every ``-d/--dist`` revision from 0 to tip of
1772 1772 the specified revlog.
1773 1773
1774 1774 The start revision can be defined via ``-s/--startrev``.
1775 1775 """
1776 1776 opts = _byteskwargs(opts)
1777 1777
1778 1778 rl = cmdutil.openrevlog(repo, b'perfrevlogrevisions', file_, opts)
1779 1779 rllen = getlen(ui)(rl)
1780 1780
1781 1781 if startrev < 0:
1782 1782 startrev = rllen + startrev
1783 1783
1784 1784 def d():
1785 1785 rl.clearcaches()
1786 1786
1787 1787 beginrev = startrev
1788 1788 endrev = rllen
1789 1789 dist = opts[b'dist']
1790 1790
1791 1791 if reverse:
1792 1792 beginrev, endrev = endrev - 1, beginrev - 1
1793 1793 dist = -1 * dist
1794 1794
1795 1795 for x in _xrange(beginrev, endrev, dist):
1796 1796 # Old Mercurial versions don't support passing an int to revision().
1797 1797 n = rl.node(x)
1798 1798 rl.revision(n)
1799 1799
1800 1800 timer, fm = gettimer(ui, opts)
1801 1801 timer(d)
1802 1802 fm.end()
1803 1803
1804 1804 @command(b'perfrevlogwrite', revlogopts + formatteropts +
1805 1805 [(b's', b'startrev', 1000, b'revision to start writing at'),
1806 1806 (b'', b'stoprev', -1, b'last revision to write'),
1807 1807 (b'', b'count', 3, b'number of runs to perform'),
1808 1808 (b'', b'details', False, b'print timing for every revision tested'),
1809 1809 (b'', b'source', b'full', b'the kind of data fed into the revlog'),
1810 1810 (b'', b'lazydeltabase', True, b'try the provided delta first'),
1811 1811 (b'', b'clear-caches', True, b'clear revlog cache between calls'),
1812 1812 ],
1813 1813 b'-c|-m|FILE')
1814 1814 def perfrevlogwrite(ui, repo, file_=None, startrev=1000, stoprev=-1, **opts):
1815 1815 """Benchmark writing a series of revisions to a revlog.
1816 1816
1817 1817 Possible source values are:
1818 1818 * `full`: add from a full text (default).
1819 1819 * `parent-1`: add from a delta to the first parent
1820 1820 * `parent-2`: add from a delta to the second parent if it exists
1821 1821 (use a delta from the first parent otherwise)
1822 1822 * `parent-smallest`: add from the smallest delta (either p1 or p2)
1823 1823 * `storage`: add from the existing precomputed deltas
1824 1824 """
1825 1825 opts = _byteskwargs(opts)
1826 1826
1827 1827 rl = cmdutil.openrevlog(repo, b'perfrevlogwrite', file_, opts)
1828 1828 rllen = getlen(ui)(rl)
1829 1829 if startrev < 0:
1830 1830 startrev = rllen + startrev
1831 1831 if stoprev < 0:
1832 1832 stoprev = rllen + stoprev
1833 1833
1834 1834 lazydeltabase = opts['lazydeltabase']
1835 1835 source = opts['source']
1836 1836 clearcaches = opts['clear_caches']
1837 1837 validsource = (b'full', b'parent-1', b'parent-2', b'parent-smallest',
1838 1838 b'storage')
1839 1839 if source not in validsource:
1840 1840 raise error.Abort('invalid source type: %s' % source)
1841 1841
1842 1842 ### actually gather results
1843 1843 count = opts['count']
1844 1844 if count <= 0:
1845 1845 raise error.Abort('invalid run count: %d' % count)
1846 1846 allresults = []
1847 1847 for c in range(count):
1848 1848 timing = _timeonewrite(ui, rl, source, startrev, stoprev, c + 1,
1849 1849 lazydeltabase=lazydeltabase,
1850 1850 clearcaches=clearcaches)
1851 1851 allresults.append(timing)
1852 1852
1853 1853 ### consolidate the results in a single list
1854 1854 results = []
1855 1855 for idx, (rev, t) in enumerate(allresults[0]):
1856 1856 ts = [t]
1857 1857 for other in allresults[1:]:
1858 1858 orev, ot = other[idx]
1859 1859 assert orev == rev
1860 1860 ts.append(ot)
1861 1861 results.append((rev, ts))
1862 1862 resultcount = len(results)
1863 1863
1864 1864 ### Compute and display relevant statistics
1865 1865
1866 1866 # get a formatter
1867 1867 fm = ui.formatter(b'perf', opts)
1868 1868 displayall = ui.configbool(b"perf", b"all-timing", False)
1869 1869
1870 1870 # print individual details if requested
1871 1871 if opts['details']:
1872 1872 for idx, item in enumerate(results, 1):
1873 1873 rev, data = item
1874 1874 title = 'revision #%d of %d, rev %d' % (idx, resultcount, rev)
1875 1875 formatone(fm, data, title=title, displayall=displayall)
1876 1876
1877 1877 # sorts results by median time
1878 1878 results.sort(key=lambda x: sorted(x[1])[len(x[1]) // 2])
1879 1879 # list of (name, index) to display
1880 1880 relevants = [
1881 1881 ("min", 0),
1882 1882 ("10%", resultcount * 10 // 100),
1883 1883 ("25%", resultcount * 25 // 100),
1884 1884 ("50%", resultcount * 70 // 100),
1885 1885 ("75%", resultcount * 75 // 100),
1886 1886 ("90%", resultcount * 90 // 100),
1887 1887 ("95%", resultcount * 95 // 100),
1888 1888 ("99%", resultcount * 99 // 100),
1889 1889 ("99.9%", resultcount * 999 // 1000),
1890 1890 ("99.99%", resultcount * 9999 // 10000),
1891 1891 ("99.999%", resultcount * 99999 // 100000),
1892 1892 ("max", -1),
1893 1893 ]
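# With results sorted by median time, indexing at N% of the list length
# approximates the Nth percentile of the per-revision timings.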
1894 1894 if not ui.quiet:
1895 1895 for name, idx in relevants:
1896 1896 data = results[idx]
1897 1897 title = '%s of %d, rev %d' % (name, resultcount, data[0])
1898 1898 formatone(fm, data[1], title=title, displayall=displayall)
1899 1899
1900 1900 # XXX summing that many floats will not be very precise; we ignore this
1901 1901 # fact for now
1902 1902 totaltime = []
1903 1903 for item in allresults:
1904 1904 totaltime.append((sum(x[1][0] for x in item),
1905 1905 sum(x[1][1] for x in item),
1906 1906 sum(x[1][2] for x in item),)
1907 1907 )
1908 1908 formatone(fm, totaltime, title="total time (%d revs)" % resultcount,
1909 1909 displayall=displayall)
1910 1910 fm.end()
1911 1911
1912 1912 class _faketr(object):
1913 1913 def add(s, x, y, z=None):
1914 1914 return None
1915 1915
1916 1916 def _timeonewrite(ui, orig, source, startrev, stoprev, runidx=None,
1917 1917 lazydeltabase=True, clearcaches=True):
1918 1918 timings = []
1919 1919 tr = _faketr()
1920 1920 with _temprevlog(ui, orig, startrev) as dest:
1921 1921 dest._lazydeltabase = lazydeltabase
1922 1922 revs = list(orig.revs(startrev, stoprev))
1923 1923 total = len(revs)
1924 1924 topic = 'adding'
1925 1925 if runidx is not None:
1926 1926 topic += ' (run #%d)' % runidx
1927 1927 # Support both old and new progress API
1928 1928 if util.safehasattr(ui, 'makeprogress'):
1929 1929 progress = ui.makeprogress(topic, unit='revs', total=total)
1930 1930 def updateprogress(pos):
1931 1931 progress.update(pos)
1932 1932 def completeprogress():
1933 1933 progress.complete()
1934 1934 else:
1935 1935 def updateprogress(pos):
1936 1936 ui.progress(topic, pos, unit='revs', total=total)
1937 1937 def completeprogress():
1938 1938 ui.progress(topic, None, unit='revs', total=total)
1939 1939
1940 1940 for idx, rev in enumerate(revs):
1941 1941 updateprogress(idx)
1942 1942 addargs, addkwargs = _getrevisionseed(orig, rev, tr, source)
1943 1943 if clearcaches:
1944 1944 dest.index.clearcaches()
1945 1945 dest.clearcaches()
1946 1946 with timeone() as r:
1947 1947 dest.addrawrevision(*addargs, **addkwargs)
1948 1948 timings.append((rev, r[0]))
1949 1949 updateprogress(total)
1950 1950 completeprogress()
1951 1951 return timings
1952 1952
1953 1953 def _getrevisionseed(orig, rev, tr, source):
1954 1954 from mercurial.node import nullid
1955 1955
1956 1956 linkrev = orig.linkrev(rev)
1957 1957 node = orig.node(rev)
1958 1958 p1, p2 = orig.parents(node)
1959 1959 flags = orig.flags(rev)
1960 1960 cachedelta = None
1961 1961 text = None
1962 1962
1963 1963 if source == b'full':
1964 1964 text = orig.revision(rev)
1965 1965 elif source == b'parent-1':
1966 1966 baserev = orig.rev(p1)
1967 1967 cachedelta = (baserev, orig.revdiff(p1, rev))
1968 1968 elif source == b'parent-2':
1969 1969 parent = p2
1970 1970 if p2 == nullid:
1971 1971 parent = p1
1972 1972 baserev = orig.rev(parent)
1973 1973 cachedelta = (baserev, orig.revdiff(parent, rev))
1974 1974 elif source == b'parent-smallest':
1975 1975 p1diff = orig.revdiff(p1, rev)
1976 1976 parent = p1
1977 1977 diff = p1diff
1978 1978 if p2 != nullid:
1979 1979 p2diff = orig.revdiff(p2, rev)
1980 1980 if len(p1diff) > len(p2diff):
1981 1981 parent = p2
1982 1982 diff = p2diff
1983 1983 baserev = orig.rev(parent)
1984 1984 cachedelta = (baserev, diff)
1985 1985 elif source == b'storage':
1986 1986 baserev = orig.deltaparent(rev)
1987 1987 cachedelta = (baserev, orig.revdiff(orig.node(baserev), rev))
1988 1988
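# addrawrevision() accepts either a fulltext or a cached delta; exactly
# one of text/cachedelta is set, depending on the requested source.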
1989 1989 return ((text, tr, linkrev, p1, p2),
1990 1990 {'node': node, 'flags': flags, 'cachedelta': cachedelta})
1991 1991
1992 1992 @contextlib.contextmanager
1993 1993 def _temprevlog(ui, orig, truncaterev):
1994 1994 from mercurial import vfs as vfsmod
1995 1995
1996 1996 if orig._inline:
1997 1997 raise error.Abort('not supporting inline revlog (yet)')
1998 1998
1999 1999 origindexpath = orig.opener.join(orig.indexfile)
2000 2000 origdatapath = orig.opener.join(orig.datafile)
2001 2001 indexname = 'revlog.i'
2002 2002 dataname = 'revlog.d'
2003 2003
2004 2004 tmpdir = tempfile.mkdtemp(prefix='tmp-hgperf-')
2005 2005 try:
2006 2006 # copy the data file in a temporary directory
2007 2007 ui.debug('copying data in %s\n' % tmpdir)
2008 2008 destindexpath = os.path.join(tmpdir, 'revlog.i')
2009 2009 destdatapath = os.path.join(tmpdir, 'revlog.d')
2010 2010 shutil.copyfile(origindexpath, destindexpath)
2011 2011 shutil.copyfile(origdatapath, destdatapath)
2012 2012
2013 2013 # remove the data we want to add again
2014 2014 ui.debug('truncating data to be rewritten\n')
2015 2015 with open(destindexpath, 'ab') as index:
2016 2016 index.seek(0)
2017 2017 index.truncate(truncaterev * orig._io.size)
2018 2018 with open(destdatapath, 'ab') as data:
2019 2019 data.seek(0)
2020 2020 data.truncate(orig.start(truncaterev))
2021 2021
2022 2022 # instantiate a new revlog from the temporary copy
2023 2023 ui.debug('instantiating revlog from the truncated copy\n')
2024 2024 vfs = vfsmod.vfs(tmpdir)
2025 2025 vfs.options = getattr(orig.opener, 'options', None)
2026 2026
2027 2027 dest = revlog.revlog(vfs,
2028 2028 indexfile=indexname,
2029 2029 datafile=dataname)
2030 2030 if dest._inline:
2031 2031 raise error.Abort('not supporting inline revlog (yet)')
2032 2032 # make sure internals are initialized
2033 2033 dest.revision(len(dest) - 1)
2034 2034 yield dest
2035 2035 del dest, vfs
2036 2036 finally:
2037 2037 shutil.rmtree(tmpdir, True)
2038 2038
2039 2039 @command(b'perfrevlogchunks', revlogopts + formatteropts +
2040 2040 [(b'e', b'engines', b'', b'compression engines to use'),
2041 2041 (b's', b'startrev', 0, b'revision to start at')],
2042 2042 b'-c|-m|FILE')
2043 2043 def perfrevlogchunks(ui, repo, file_=None, engines=None, startrev=0, **opts):
2044 2044 """Benchmark operations on revlog chunks.
2045 2045
2046 2046 Logically, each revlog is a collection of fulltext revisions. However,
2047 2047 stored within each revlog are "chunks" of possibly compressed data. This
2048 2048 data needs to be read and decompressed or compressed and written.
2049 2049
2050 2050 This command measures the time it takes to read+decompress and recompress
2051 2051 chunks in a revlog. It effectively isolates I/O and compression performance.
2052 2052 For measurements of higher-level operations like resolving revisions,
2053 2053 see ``perfrevlogrevisions`` and ``perfrevlogrevision``.
2054 2054 """
2055 2055 opts = _byteskwargs(opts)
2056 2056
2057 2057 rl = cmdutil.openrevlog(repo, b'perfrevlogchunks', file_, opts)
2058 2058
2059 2059 # _chunkraw was renamed to _getsegmentforrevs.
2060 2060 try:
2061 2061 segmentforrevs = rl._getsegmentforrevs
2062 2062 except AttributeError:
2063 2063 segmentforrevs = rl._chunkraw
2064 2064
2065 2065 # Verify engines argument.
2066 2066 if engines:
2067 2067 engines = set(e.strip() for e in engines.split(b','))
2068 2068 for engine in engines:
2069 2069 try:
2070 2070 util.compressionengines[engine]
2071 2071 except KeyError:
2072 2072 raise error.Abort(b'unknown compression engine: %s' % engine)
2073 2073 else:
2074 2074 engines = []
2075 2075 for e in util.compengines:
2076 2076 engine = util.compengines[e]
2077 2077 try:
2078 2078 if engine.available():
2079 2079 engine.revlogcompressor().compress(b'dummy')
2080 2080 engines.append(e)
2081 2081 except NotImplementedError:
2082 2082 pass
2083 2083
2084 2084 revs = list(rl.revs(startrev, len(rl) - 1))
2085 2085
2086 2086 def rlfh(rl):
2087 2087 if rl._inline:
2088 2088 return getsvfs(repo)(rl.indexfile)
2089 2089 else:
2090 2090 return getsvfs(repo)(rl.datafile)
2091 2091
2092 2092 def doread():
2093 2093 rl.clearcaches()
2094 2094 for rev in revs:
2095 2095 segmentforrevs(rev, rev)
2096 2096
2097 2097 def doreadcachedfh():
2098 2098 rl.clearcaches()
2099 2099 fh = rlfh(rl)
2100 2100 for rev in revs:
2101 2101 segmentforrevs(rev, rev, df=fh)
2102 2102
2103 2103 def doreadbatch():
2104 2104 rl.clearcaches()
2105 2105 segmentforrevs(revs[0], revs[-1])
2106 2106
2107 2107 def doreadbatchcachedfh():
2108 2108 rl.clearcaches()
2109 2109 fh = rlfh(rl)
2110 2110 segmentforrevs(revs[0], revs[-1], df=fh)
2111 2111
2112 2112 def dochunk():
2113 2113 rl.clearcaches()
2114 2114 fh = rlfh(rl)
2115 2115 for rev in revs:
2116 2116 rl._chunk(rev, df=fh)
2117 2117
2118 2118 chunks = [None]
2119 2119
2120 2120 def dochunkbatch():
2121 2121 rl.clearcaches()
2122 2122 fh = rlfh(rl)
2123 2123 # Save chunks as a side-effect.
2124 2124 chunks[0] = rl._chunks(revs, df=fh)
2125 2125
2126 2126 def docompress(compressor):
2127 2127 rl.clearcaches()
2128 2128
2129 2129 try:
2130 2130 # Swap in the requested compression engine.
2131 2131 oldcompressor = rl._compressor
2132 2132 rl._compressor = compressor
2133 2133 for chunk in chunks[0]:
2134 2134 rl.compress(chunk)
2135 2135 finally:
2136 2136 rl._compressor = oldcompressor
2137 2137
2138 2138 benches = [
2139 2139 (lambda: doread(), b'read'),
2140 2140 (lambda: doreadcachedfh(), b'read w/ reused fd'),
2141 2141 (lambda: doreadbatch(), b'read batch'),
2142 2142 (lambda: doreadbatchcachedfh(), b'read batch w/ reused fd'),
2143 2143 (lambda: dochunk(), b'chunk'),
2144 2144 (lambda: dochunkbatch(), b'chunk batch'),
2145 2145 ]
2146 2146
2147 2147 for engine in sorted(engines):
2148 2148 compressor = util.compengines[engine].revlogcompressor()
2149 2149 benches.append((functools.partial(docompress, compressor),
2150 2150 b'compress w/ %s' % engine))
2151 2151
2152 2152 for fn, title in benches:
2153 2153 timer, fm = gettimer(ui, opts)
2154 2154 timer(fn, title=title)
2155 2155 fm.end()
2156 2156
2157 2157 @command(b'perfrevlogrevision', revlogopts + formatteropts +
2158 2158 [(b'', b'cache', False, b'use caches instead of clearing')],
2159 2159 b'-c|-m|FILE REV')
2160 2160 def perfrevlogrevision(ui, repo, file_, rev=None, cache=None, **opts):
2161 2161 """Benchmark obtaining a revlog revision.
2162 2162
2163 2163 Obtaining a revlog revision consists of roughly the following steps:
2164 2164
2165 2165 1. Compute the delta chain
2166 2166 2. Slice the delta chain if applicable
2167 2167 3. Obtain the raw chunks for that delta chain
2168 2168 4. Decompress each raw chunk
2169 2169 5. Apply binary patches to obtain fulltext
2170 2170 6. Verify hash of fulltext
2171 2171
2172 2172 This command measures the time spent in each of these phases.
2173 2173 """
2174 2174 opts = _byteskwargs(opts)
2175 2175
2176 2176 if opts.get(b'changelog') or opts.get(b'manifest'):
2177 2177 file_, rev = None, file_
2178 2178 elif rev is None:
2179 2179 raise error.CommandError(b'perfrevlogrevision', b'invalid arguments')
2180 2180
2181 2181 r = cmdutil.openrevlog(repo, b'perfrevlogrevision', file_, opts)
2182 2182
2183 2183 # _chunkraw was renamed to _getsegmentforrevs.
2184 2184 try:
2185 2185 segmentforrevs = r._getsegmentforrevs
2186 2186 except AttributeError:
2187 2187 segmentforrevs = r._chunkraw
2188 2188
2189 2189 node = r.lookup(rev)
2190 2190 rev = r.rev(node)
2191 2191
2192 2192 def getrawchunks(data, chain):
2193 2193 start = r.start
2194 2194 length = r.length
2195 2195 inline = r._inline
2196 2196 iosize = r._io.size
2197 2197 buffer = util.buffer
2198 2198
2199 2199 chunks = []
2200 2200 ladd = chunks.append
2201 2201 for idx, item in enumerate(chain):
2202 2202 offset = start(item[0])
2203 2203 bits = data[idx]
2204 2204 for rev in item:
2205 2205 chunkstart = start(rev)
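# In an inline revlog, index entries are interleaved with the data, so
# the chunk offset is shifted by one index-entry size for each of the
# rev + 1 entries written before the chunk.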
2206 2206 if inline:
2207 2207 chunkstart += (rev + 1) * iosize
2208 2208 chunklength = length(rev)
2209 2209 ladd(buffer(bits, chunkstart - offset, chunklength))
2210 2210
2211 2211 return chunks
2212 2212
2213 2213 def dodeltachain(rev):
2214 2214 if not cache:
2215 2215 r.clearcaches()
2216 2216 r._deltachain(rev)
2217 2217
2218 2218 def doread(chain):
2219 2219 if not cache:
2220 2220 r.clearcaches()
2221 2221 for item in slicedchain:
2222 2222 segmentforrevs(item[0], item[-1])
2223 2223
2224 2224 def doslice(r, chain, size):
2225 2225 for s in slicechunk(r, chain, targetsize=size):
2226 2226 pass
2227 2227
2228 2228 def dorawchunks(data, chain):
2229 2229 if not cache:
2230 2230 r.clearcaches()
2231 2231 getrawchunks(data, chain)
2232 2232
2233 2233 def dodecompress(chunks):
2234 2234 decomp = r.decompress
2235 2235 for chunk in chunks:
2236 2236 decomp(chunk)
2237 2237
2238 2238 def dopatch(text, bins):
2239 2239 if not cache:
2240 2240 r.clearcaches()
2241 2241 mdiff.patches(text, bins)
2242 2242
2243 2243 def dohash(text):
2244 2244 if not cache:
2245 2245 r.clearcaches()
2246 2246 r.checkhash(text, node, rev=rev)
2247 2247
2248 2248 def dorevision():
2249 2249 if not cache:
2250 2250 r.clearcaches()
2251 2251 r.revision(node)
2252 2252
2253 2253 try:
2254 2254 from mercurial.revlogutils.deltas import slicechunk
2255 2255 except ImportError:
2256 2256 slicechunk = getattr(revlog, '_slicechunk', None)
2257 2257
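# Precompute every intermediate result once, so each phase benchmark
# below can run in isolation: the delta chain, its sliced segments, the
# raw and decompressed chunks, and the patched fulltext.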
2258 2258 size = r.length(rev)
2259 2259 chain = r._deltachain(rev)[0]
2260 2260 if not getattr(r, '_withsparseread', False):
2261 2261 slicedchain = (chain,)
2262 2262 else:
2263 2263 slicedchain = tuple(slicechunk(r, chain, targetsize=size))
2264 2264 data = [segmentforrevs(seg[0], seg[-1])[1] for seg in slicedchain]
2265 2265 rawchunks = getrawchunks(data, slicedchain)
2266 2266 bins = r._chunks(chain)
2267 2267 text = bytes(bins[0])
2268 2268 bins = bins[1:]
2269 2269 text = mdiff.patches(text, bins)
2270 2270
2271 2271 benches = [
2272 2272 (lambda: dorevision(), b'full'),
2273 2273 (lambda: dodeltachain(rev), b'deltachain'),
2274 2274 (lambda: doread(chain), b'read'),
2275 2275 ]
2276 2276
2277 2277 if getattr(r, '_withsparseread', False):
2278 2278 slicing = (lambda: doslice(r, chain, size), b'slice-sparse-chain')
2279 2279 benches.append(slicing)
2280 2280
2281 2281 benches.extend([
2282 2282 (lambda: dorawchunks(data, slicedchain), b'rawchunks'),
2283 2283 (lambda: dodecompress(rawchunks), b'decompress'),
2284 2284 (lambda: dopatch(text, bins), b'patch'),
2285 2285 (lambda: dohash(text), b'hash'),
2286 2286 ])
2287 2287
2288 2288 timer, fm = gettimer(ui, opts)
2289 2289 for fn, title in benches:
2290 2290 timer(fn, title=title)
2291 2291 fm.end()
2292 2292
2293 2293 @command(b'perfrevset',
2294 2294 [(b'C', b'clear', False, b'clear volatile cache between each call.'),
2295 2295 (b'', b'contexts', False, b'obtain changectx for each revision')]
2296 2296 + formatteropts, b"REVSET")
2297 2297 def perfrevset(ui, repo, expr, clear=False, contexts=False, **opts):
2298 2298 """benchmark the execution time of a revset
2299 2299
2300 2300 Use the --clear option to evaluate the impact of rebuilding the volatile
2301 2301 revision set caches on revset execution. The volatile caches hold data
2302 2302 related to filtering and obsolescence."""
2303 2303 opts = _byteskwargs(opts)
2304 2304
2305 2305 timer, fm = gettimer(ui, opts)
2306 2306 def d():
2307 2307 if clear:
2308 2308 repo.invalidatevolatilesets()
2309 2309 if contexts:
2310 2310 for ctx in repo.set(expr): pass
2311 2311 else:
2312 2312 for r in repo.revs(expr): pass
2313 2313 timer(d)
2314 2314 fm.end()
2315 2315
2316 2316 @command(b'perfvolatilesets',
2317 2317 [(b'', b'clear-obsstore', False, b'drop obsstore between each call.'),
2318 2318 ] + formatteropts)
2319 2319 def perfvolatilesets(ui, repo, *names, **opts):
2320 2320 """benchmark the computation of various volatile set
2321 2321
2322 2322 Volatile set computes element related to filtering and obsolescence."""
2323 2323 opts = _byteskwargs(opts)
2324 2324 timer, fm = gettimer(ui, opts)
2325 2325 repo = repo.unfiltered()
2326 2326
2327 2327 def getobs(name):
2328 2328 def d():
2329 2329 repo.invalidatevolatilesets()
2330 2330 if opts[b'clear_obsstore']:
2331 2331 clearfilecache(repo, b'obsstore')
2332 2332 obsolete.getrevs(repo, name)
2333 2333 return d
2334 2334
2335 2335 allobs = sorted(obsolete.cachefuncs)
2336 2336 if names:
2337 2337 allobs = [n for n in allobs if n in names]
2338 2338
2339 2339 for name in allobs:
2340 2340 timer(getobs(name), title=name)
2341 2341
2342 2342 def getfiltered(name):
2343 2343 def d():
2344 2344 repo.invalidatevolatilesets()
2345 2345 if opts[b'clear_obsstore']:
2346 2346 clearfilecache(repo, b'obsstore')
2347 2347 repoview.filterrevs(repo, name)
2348 2348 return d
2349 2349
2350 2350 allfilter = sorted(repoview.filtertable)
2351 2351 if names:
2352 2352 allfilter = [n for n in allfilter if n in names]
2353 2353
2354 2354 for name in allfilter:
2355 2355 timer(getfiltered(name), title=name)
2356 2356 fm.end()
2357 2357
2358 2358 @command(b'perfbranchmap',
2359 2359 [(b'f', b'full', False,
2360 2360 b'Includes build time of subset'),
2361 2361 (b'', b'clear-revbranch', False,
2362 2362 b'purge the revbranch cache between computation'),
2363 2363 ] + formatteropts)
2364 2364 def perfbranchmap(ui, repo, *filternames, **opts):
2365 2365 """benchmark the update of a branchmap
2366 2366
2367 2367 This benchmarks the full repo.branchmap() call with read and write disabled
2368 2368 """
2369 2369 opts = _byteskwargs(opts)
2370 2370 full = opts.get(b"full", False)
2371 2371 clear_revbranch = opts.get(b"clear_revbranch", False)
2372 2372 timer, fm = gettimer(ui, opts)
2373 2373 def getbranchmap(filtername):
2374 2374 """generate a benchmark function for the filtername"""
2375 2375 if filtername is None:
2376 2376 view = repo
2377 2377 else:
2378 2378 view = repo.filtered(filtername)
2379 2379 def d():
2380 2380 if clear_revbranch:
2381 2381 repo.revbranchcache()._clear()
2382 2382 if full:
2383 2383 view._branchcaches.clear()
2384 2384 else:
2385 2385 view._branchcaches.pop(filtername, None)
2386 2386 view.branchmap()
2387 2387 return d
2388 2388 # add filters from smaller subsets to bigger subsets
2389 2389 possiblefilters = set(repoview.filtertable)
2390 2390 if filternames:
2391 2391 possiblefilters &= set(filternames)
2392 2392 subsettable = getbranchmapsubsettable()
2393 2393 allfilters = []
2394 2394 while possiblefilters:
2395 2395 for name in possiblefilters:
2396 2396 subset = subsettable.get(name)
2397 2397 if subset not in possiblefilters:
2398 2398 break
2399 2399 else:
2400 2400 assert False, b'subset cycle %s!' % possiblefilters
2401 2401 allfilters.append(name)
2402 2402 possiblefilters.remove(name)
2403 2403
2404 2404 # warm the cache
2405 2405 if not full:
2406 2406 for name in allfilters:
2407 2407 repo.filtered(name).branchmap()
2408 2408 if not filternames or b'unfiltered' in filternames:
2409 2409 # add unfiltered
2410 2410 allfilters.append(None)
2411 2411
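# Stub out branchmap cache I/O so the timings measure pure in-memory
# computation; newer Mercurial exposes branchcache.fromfile, while older
# versions use a module-level read().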
2412 branchcacheread = safeattrsetter(branchmap, b'read')
2412 if util.safehasattr(branchmap.branchcache, 'fromfile'):
2413 branchcacheread = safeattrsetter(branchmap.branchcache, b'fromfile')
2414 branchcacheread.set(classmethod(lambda *args: None))
2415 else:
2416 # older versions
2417 branchcacheread = safeattrsetter(branchmap, b'read')
2418 branchcacheread.set(lambda *args: None)
2413 2419 branchcachewrite = safeattrsetter(branchmap.branchcache, b'write')
2414 branchcacheread.set(lambda repo: None)
2415 branchcachewrite.set(lambda bc, repo: None)
2420 branchcachewrite.set(lambda *args: None)
2416 2421 try:
2417 2422 for name in allfilters:
2418 2423 printname = name
2419 2424 if name is None:
2420 2425 printname = b'unfiltered'
2421 2426 timer(getbranchmap(name), title=str(printname))
2422 2427 finally:
2423 2428 branchcacheread.restore()
2424 2429 branchcachewrite.restore()
2425 2430 fm.end()
2426 2431
2427 2432 @command(b'perfbranchmapupdate', [
2428 2433 (b'', b'base', [], b'subset of revision to start from'),
2429 2434 (b'', b'target', [], b'subset of revision to end with'),
2430 2435 (b'', b'clear-caches', False, b'clear cache between each runs')
2431 2436 ] + formatteropts)
2432 2437 def perfbranchmapupdate(ui, repo, base=(), target=(), **opts):
2433 2438 """benchmark branchmap update from for <base> revs to <target> revs
2434 2439
2435 2440 If `--clear-caches` is passed, the following items will be reset before
2436 2441 each update:
2437 2442 * the changelog instance and associated indexes
2438 2443 * the rev-branch-cache instance
2439 2444
2440 2445 Examples:
2441 2446
2442 2447 # update for the one last revision
2443 2448 $ hg perfbranchmapupdate --base 'not tip' --target 'tip'
2444 2449
2445 2450 # update for a change coming with a new branch
2446 2451 $ hg perfbranchmapupdate --base 'stable' --target 'default'
2447 2452 """
2448 2453 from mercurial import branchmap
2449 2454 from mercurial import repoview
2450 2455 opts = _byteskwargs(opts)
2451 2456 timer, fm = gettimer(ui, opts)
2452 2457 clearcaches = opts[b'clear_caches']
2453 2458 unfi = repo.unfiltered()
2454 2459 x = [None] # used to pass data between closures
2455 2460
2456 2461 # we use a `list` here to avoid possible side effects from smartset
2457 2462 baserevs = list(scmutil.revrange(repo, base))
2458 2463 targetrevs = list(scmutil.revrange(repo, target))
2459 2464 if not baserevs:
2460 2465 raise error.Abort(b'no revisions selected for --base')
2461 2466 if not targetrevs:
2462 2467 raise error.Abort(b'no revisions selected for --target')
2463 2468
2464 2469 # make sure the target branchmap also contains the one in the base
2465 2470 targetrevs = list(set(baserevs) | set(targetrevs))
2466 2471 targetrevs.sort()
2467 2472
2468 2473 cl = repo.changelog
2469 2474 allbaserevs = list(cl.ancestors(baserevs, inclusive=True))
2470 2475 allbaserevs.sort()
2471 2476 alltargetrevs = frozenset(cl.ancestors(targetrevs, inclusive=True))
2472 2477
2473 2478 newrevs = list(alltargetrevs.difference(allbaserevs))
2474 2479 newrevs.sort()
2475 2480
2476 2481 allrevs = frozenset(unfi.changelog.revs())
2477 2482 basefilterrevs = frozenset(allrevs.difference(allbaserevs))
2478 2483 targetfilterrevs = frozenset(allrevs.difference(alltargetrevs))
2479 2484
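# Build temporary repoview filters exposing exactly the base and target
# revision sets, so the branchmap update can be replayed between the two
# states.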
2480 2485 def basefilter(repo, visibilityexceptions=None):
2481 2486 return basefilterrevs
2482 2487
2483 2488 def targetfilter(repo, visibilityexceptions=None):
2484 2489 return targetfilterrevs
2485 2490
2486 2491 msg = b'benchmark of branchmap with %d revisions with %d new ones\n'
2487 2492 ui.status(msg % (len(allbaserevs), len(newrevs)))
2488 2493 if targetfilterrevs:
2489 2494 msg = b'(%d revisions still filtered)\n'
2490 2495 ui.status(msg % len(targetfilterrevs))
2491 2496
2492 2497 try:
2493 2498 repoview.filtertable[b'__perf_branchmap_update_base'] = basefilter
2494 2499 repoview.filtertable[b'__perf_branchmap_update_target'] = targetfilter
2495 2500
2496 2501 baserepo = repo.filtered(b'__perf_branchmap_update_base')
2497 2502 targetrepo = repo.filtered(b'__perf_branchmap_update_target')
2498 2503
2499 2504 # try to find an existing branchmap to reuse
2500 2505 subsettable = getbranchmapsubsettable()
2501 2506 candidatefilter = subsettable.get(None)
2502 2507 while candidatefilter is not None:
2503 2508 candidatebm = repo.filtered(candidatefilter).branchmap()
2504 2509 if candidatebm.validfor(baserepo):
2505 2510 filtered = repoview.filterrevs(repo, candidatefilter)
2506 2511 missing = [r for r in allbaserevs if r in filtered]
2507 2512 base = candidatebm.copy()
2508 2513 base.update(baserepo, missing)
2509 2514 break
2510 2515 candidatefilter = subsettable.get(candidatefilter)
2511 2516 else:
2512 2517 # no suitable subset was found
2513 2518 base = branchmap.branchcache()
2514 2519 base.update(baserepo, allbaserevs)
2515 2520
2516 2521 def setup():
2517 2522 x[0] = base.copy()
2518 2523 if clearcaches:
2519 2524 unfi._revbranchcache = None
2520 2525 clearchangelog(repo)
2521 2526
2522 2527 def bench():
2523 2528 x[0].update(targetrepo, newrevs)
2524 2529
2525 2530 timer(bench, setup=setup)
2526 2531 fm.end()
2527 2532 finally:
2528 2533 repoview.filtertable.pop(b'__perf_branchmap_update_base', None)
2529 2534 repoview.filtertable.pop(b'__perf_branchmap_update_target', None)
2530 2535
2531 2536 @command(b'perfbranchmapload', [
2532 2537 (b'f', b'filter', b'', b'Specify repoview filter'),
2533 2538 (b'', b'list', False, b'List branchmap filter caches'),
2534 2539 (b'', b'clear-revlogs', False, b'refresh changelog and manifest'),
2535 2540
2536 2541 ] + formatteropts)
2537 2542 def perfbranchmapload(ui, repo, filter=b'', list=False, **opts):
2538 2543 """benchmark reading the branchmap"""
2539 2544 opts = _byteskwargs(opts)
2540 2545 clearrevlogs = opts[b'clear_revlogs']
2541 2546
2542 2547 if list:
2543 2548 for name, kind, st in repo.cachevfs.readdir(stat=True):
2544 2549 if name.startswith(b'branch2'):
2545 2550 filtername = name.partition(b'-')[2] or b'unfiltered'
2546 2551 ui.status(b'%s - %s\n'
2547 2552 % (filtername, util.bytecount(st.st_size)))
2548 2553 return
2549 2554 if not filter:
2550 2555 filter = None
2551 2556 subsettable = getbranchmapsubsettable()
2552 2557 if filter is None:
2553 2558 repo = repo.unfiltered()
2554 2559 else:
2555 2560 repo = repoview.repoview(repo, filter)
2556 2561
2557 2562 repo.branchmap() # make sure we have a relevant, up to date branchmap
2558 2563
2564 try:
2565 fromfile = branchmap.branchcache.fromfile
2566 except AttributeError:
2567 # older versions
2568 fromfile = branchmap.read
2569
2559 2570 currentfilter = filter
2560 2571 # try once without timer, the filter may not be cached
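# If no branchmap is cached on disk for this exact filter, walk up the
# nearest-subset chain until a cached one is found.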
2561 while branchmap.read(repo) is None:
2572 while fromfile(repo) is None:
2562 2573 currentfilter = subsettable.get(currentfilter)
2563 2574 if currentfilter is None:
2564 2575 raise error.Abort(b'No branchmap cached for %s repo'
2565 2576 % (filter or b'unfiltered'))
2566 2577 repo = repo.filtered(currentfilter)
2567 2578 timer, fm = gettimer(ui, opts)
2568 2579 def setup():
2569 2580 if clearrevlogs:
2570 2581 clearchangelog(repo)
2571 2582 def bench():
2572 branchmap.read(repo)
2583 fromfile(repo)
2573 2584 timer(bench, setup=setup)
2574 2585 fm.end()
2575 2586
2576 2587 @command(b'perfloadmarkers')
2577 2588 def perfloadmarkers(ui, repo):
2578 2589 """benchmark the time to parse the on-disk markers for a repo
2579 2590
2580 2591 Result is the number of markers in the repo."""
2581 2592 timer, fm = gettimer(ui)
2582 2593 svfs = getsvfs(repo)
2583 2594 timer(lambda: len(obsolete.obsstore(svfs)))
2584 2595 fm.end()
2585 2596
2586 2597 @command(b'perflrucachedict', formatteropts +
2587 2598 [(b'', b'costlimit', 0, b'maximum total cost of items in cache'),
2588 2599 (b'', b'mincost', 0, b'smallest cost of items in cache'),
2589 2600 (b'', b'maxcost', 100, b'maximum cost of items in cache'),
2590 2601 (b'', b'size', 4, b'size of cache'),
2591 2602 (b'', b'gets', 10000, b'number of key lookups'),
2592 2603 (b'', b'sets', 10000, b'number of key sets'),
2593 2604 (b'', b'mixed', 10000, b'number of mixed mode operations'),
2594 2605 (b'', b'mixedgetfreq', 50, b'frequency of get vs set ops in mixed mode')],
2595 2606 norepo=True)
2596 2607 def perflrucache(ui, mincost=0, maxcost=100, costlimit=0, size=4,
2597 2608 gets=10000, sets=10000, mixed=10000, mixedgetfreq=50, **opts):
2598 2609 opts = _byteskwargs(opts)
2599 2610
2600 2611 def doinit():
2601 2612 for i in _xrange(10000):
2602 2613 util.lrucachedict(size)
2603 2614
2604 2615 costrange = list(range(mincost, maxcost + 1))
2605 2616
2606 2617 values = []
2607 2618 for i in _xrange(size):
2608 2619 values.append(random.randint(0, _maxint))
2609 2620
2610 2621 # Get mode fills the cache and tests raw lookup performance with no
2611 2622 # eviction.
2612 2623 getseq = []
2613 2624 for i in _xrange(gets):
2614 2625 getseq.append(random.choice(values))
2615 2626
2616 2627 def dogets():
2617 2628 d = util.lrucachedict(size)
2618 2629 for v in values:
2619 2630 d[v] = v
2620 2631 for key in getseq:
2621 2632 value = d[key]
2622 2633 value # silence pyflakes warning
2623 2634
2624 2635 def dogetscost():
2625 2636 d = util.lrucachedict(size, maxcost=costlimit)
2626 2637 for i, v in enumerate(values):
2627 2638 d.insert(v, v, cost=costs[i])
2628 2639 for key in getseq:
2629 2640 try:
2630 2641 value = d[key]
2631 2642 value # silence pyflakes warning
2632 2643 except KeyError:
2633 2644 pass
2634 2645
2635 2646 # Set mode tests insertion speed with cache eviction.
2636 2647 setseq = []
2637 2648 costs = []
2638 2649 for i in _xrange(sets):
2639 2650 setseq.append(random.randint(0, _maxint))
2640 2651 costs.append(random.choice(costrange))
2641 2652
2642 2653 def doinserts():
2643 2654 d = util.lrucachedict(size)
2644 2655 for v in setseq:
2645 2656 d.insert(v, v)
2646 2657
2647 2658 def doinsertscost():
2648 2659 d = util.lrucachedict(size, maxcost=costlimit)
2649 2660 for i, v in enumerate(setseq):
2650 2661 d.insert(v, v, cost=costs[i])
2651 2662
2652 2663 def dosets():
2653 2664 d = util.lrucachedict(size)
2654 2665 for v in setseq:
2655 2666 d[v] = v
2656 2667
2657 2668 # Mixed mode randomly performs gets and sets with eviction.
2658 2669 mixedops = []
2659 2670 for i in _xrange(mixed):
2660 2671 r = random.randint(0, 100)
2661 2672 if r < mixedgetfreq:
2662 2673 op = 0
2663 2674 else:
2664 2675 op = 1
2665 2676
2666 2677 mixedops.append((op,
2667 2678 random.randint(0, size * 2),
2668 2679 random.choice(costrange)))
2669 2680
2670 2681 def domixed():
2671 2682 d = util.lrucachedict(size)
2672 2683
2673 2684 for op, v, cost in mixedops:
2674 2685 if op == 0:
2675 2686 try:
2676 2687 d[v]
2677 2688 except KeyError:
2678 2689 pass
2679 2690 else:
2680 2691 d[v] = v
2681 2692
2682 2693 def domixedcost():
2683 2694 d = util.lrucachedict(size, maxcost=costlimit)
2684 2695
2685 2696 for op, v, cost in mixedops:
2686 2697 if op == 0:
2687 2698 try:
2688 2699 d[v]
2689 2700 except KeyError:
2690 2701 pass
2691 2702 else:
2692 2703 d.insert(v, v, cost=cost)
2693 2704
2694 2705 benches = [
2695 2706 (doinit, b'init'),
2696 2707 ]
2697 2708
2698 2709 if costlimit:
2699 2710 benches.extend([
2700 2711 (dogetscost, b'gets w/ cost limit'),
2701 2712 (doinsertscost, b'inserts w/ cost limit'),
2702 2713 (domixedcost, b'mixed w/ cost limit'),
2703 2714 ])
2704 2715 else:
2705 2716 benches.extend([
2706 2717 (dogets, b'gets'),
2707 2718 (doinserts, b'inserts'),
2708 2719 (dosets, b'sets'),
2709 2720 (domixed, b'mixed')
2710 2721 ])
2711 2722
2712 2723 for fn, title in benches:
2713 2724 timer, fm = gettimer(ui, opts)
2714 2725 timer(fn, title=title)
2715 2726 fm.end()
2716 2727
2717 2728 @command(b'perfwrite', formatteropts)
2718 2729 def perfwrite(ui, repo, **opts):
2719 2730 """microbenchmark ui.write
2720 2731 """
2721 2732 opts = _byteskwargs(opts)
2722 2733
2723 2734 timer, fm = gettimer(ui, opts)
2724 2735 def write():
2725 2736 for i in range(100000):
2726 2737 ui.write((b'Testing write performance\n'))
2727 2738 timer(write)
2728 2739 fm.end()
2729 2740
2730 2741 def uisetup(ui):
2731 2742 if (util.safehasattr(cmdutil, b'openrevlog') and
2732 2743 not util.safehasattr(commands, b'debugrevlogopts')):
2733 2744 # for "historical portability":
2734 2745 # In this case, Mercurial should be 1.9 (or a79fea6b3e77) -
2735 2746 # 3.7 (or 5606f7d0d063). Therefore, '--dir' option for
2736 2747 # openrevlog() should cause failure, because it has been
2737 2748 # available since 3.5 (or 49c583ca48c4).
2738 2749 def openrevlog(orig, repo, cmd, file_, opts):
2739 2750 if opts.get(b'dir') and not util.safehasattr(repo, b'dirlog'):
2740 2751 raise error.Abort(b"This version doesn't support --dir option",
2741 2752 hint=b"use 3.5 or later")
2742 2753 return orig(repo, cmd, file_, opts)
2743 2754 extensions.wrapfunction(cmdutil, b'openrevlog', openrevlog)
2744 2755
2745 2756 @command(b'perfprogress', formatteropts + [
2746 2757 (b'', b'topic', b'topic', b'topic for progress messages'),
2747 2758 (b'c', b'total', 1000000, b'total value we are progressing to'),
2748 2759 ], norepo=True)
2749 2760 def perfprogress(ui, topic=None, total=None, **opts):
2750 2761 """printing of progress bars"""
2751 2762 opts = _byteskwargs(opts)
2752 2763
2753 2764 timer, fm = gettimer(ui, opts)
2754 2765
2755 2766 def doprogress():
2756 2767 with ui.makeprogress(topic, total=total) as progress:
2757 2768 for i in pycompat.xrange(total):
2758 2769 progress.increment()
2759 2770
2760 2771 timer(doprogress)
2761 2772 fm.end()
@@ -1,560 +1,561 b''
1 1 # branchmap.py - logic to computes, maintain and stores branchmap for local repo
2 2 #
3 3 # Copyright 2005-2007 Matt Mackall <mpm@selenic.com>
4 4 #
5 5 # This software may be used and distributed according to the terms of the
6 6 # GNU General Public License version 2 or any later version.
7 7
8 8 from __future__ import absolute_import
9 9
10 10 import struct
11 11
12 12 from .node import (
13 13 bin,
14 14 hex,
15 15 nullid,
16 16 nullrev,
17 17 )
18 18 from . import (
19 19 encoding,
20 20 error,
21 21 pycompat,
22 22 scmutil,
23 23 util,
24 24 )
25 25 from .utils import (
26 26 stringutil,
27 27 )
28 28
29 29 calcsize = struct.calcsize
30 30 pack_into = struct.pack_into
31 31 unpack_from = struct.unpack_from
32 32
33 def _filename(repo):
34 """name of a branchcache file for a given repo or repoview"""
35 filename = "branch2"
36 if repo.filtername:
37 filename = '%s-%s' % (filename, repo.filtername)
38 return filename
39
40 def read(repo):
41 f = None
42 try:
43 f = repo.cachevfs(_filename(repo))
44 lineiter = iter(f)
45 cachekey = next(lineiter).rstrip('\n').split(" ", 2)
46 last, lrev = cachekey[:2]
47 last, lrev = bin(last), int(lrev)
48 filteredhash = None
49 if len(cachekey) > 2:
50 filteredhash = bin(cachekey[2])
51 bcache = branchcache(tipnode=last, tiprev=lrev,
52 filteredhash=filteredhash)
53 if not bcache.validfor(repo):
54 # invalidate the cache
55 raise ValueError(r'tip differs')
56 cl = repo.changelog
57 for l in lineiter:
58 l = l.rstrip('\n')
59 if not l:
60 continue
61 node, state, label = l.split(" ", 2)
62 if state not in 'oc':
63 raise ValueError(r'invalid branch state')
64 label = encoding.tolocal(label.strip())
65 node = bin(node)
66 if not cl.hasnode(node):
67 raise ValueError(
68 r'node %s does not exist' % pycompat.sysstr(hex(node)))
69 bcache.setdefault(label, []).append(node)
70 if state == 'c':
71 bcache._closednodes.add(node)
72
73 except (IOError, OSError):
74 return None
75
76 except Exception as inst:
77 if repo.ui.debugflag:
78 msg = 'invalid branchheads cache'
79 if repo.filtername is not None:
80 msg += ' (%s)' % repo.filtername
81 msg += ': %s\n'
82 repo.ui.debug(msg % pycompat.bytestr(inst))
83 bcache = None
84
85 finally:
86 if f:
87 f.close()
88
89 return bcache
90 33
91 34 ### Nearest subset relation
92 35 # Nearest subset of filter X is a filter Y so that:
93 36 # * Y is included in X,
94 37 # * X - Y is as small as possible.
95 38 # This creates an ordering used for branchmap purposes.
96 39 # The ordering may be partial.
97 40 subsettable = {None: 'visible',
98 41 'visible-hidden': 'visible',
99 42 'visible': 'served',
100 43 'served': 'immutable',
101 44 'immutable': 'base'}
102 45
103 46 def updatecache(repo):
104 47 cl = repo.changelog
105 48 filtername = repo.filtername
106 49 bcache = repo._branchcaches.get(filtername)
107 50
108 51 revs = []
109 52 if bcache is None or not bcache.validfor(repo):
110 bcache = read(repo)
53 bcache = branchcache.fromfile(repo)
111 54 if bcache is None:
112 55 subsetname = subsettable.get(filtername)
113 56 if subsetname is None:
114 57 bcache = branchcache()
115 58 else:
116 59 subset = repo.filtered(subsetname)
117 60 bcache = subset.branchmap().copy()
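# Start from the nearest subset's cache: fold in revisions filtered
# there but visible here, plus everything past the cached tip.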
118 61 extrarevs = subset.changelog.filteredrevs - cl.filteredrevs
119 62 revs.extend(r for r in extrarevs if r <= bcache.tiprev)
120 63 revs.extend(cl.revs(start=bcache.tiprev + 1))
121 64 if revs:
122 65 bcache.update(repo, revs)
123 66 bcache.write(repo)
124 67
125 68 assert bcache.validfor(repo), filtername
126 69 repo._branchcaches[repo.filtername] = bcache
127 70
128 71 def replacecache(repo, bm):
129 72 """Replace the branchmap cache for a repo with a branch mapping.
130 73
131 74 This is likely only called during clone with a branch map from a remote.
132 75 """
133 76 cl = repo.changelog
134 77 clrev = cl.rev
135 78 clbranchinfo = cl.branchinfo
136 79 rbheads = []
137 80 closed = []
138 81 for bheads in bm.itervalues():
139 82 rbheads.extend(bheads)
140 83 for h in bheads:
141 84 r = clrev(h)
142 85 b, c = clbranchinfo(r)
143 86 if c:
144 87 closed.append(h)
145 88
146 89 if rbheads:
147 90 rtiprev = max((int(clrev(node))
148 91 for node in rbheads))
149 92 cache = branchcache(bm,
150 93 repo[rtiprev].node(),
151 94 rtiprev,
152 95 closednodes=closed)
153 96
154 97 # Try to stick it as low as possible
155 98 # filters above served are unlikely to be fetched from a clone
156 99 for candidate in ('base', 'immutable', 'served'):
157 100 rview = repo.filtered(candidate)
158 101 if cache.validfor(rview):
159 102 repo._branchcaches[candidate] = cache
160 103 cache.write(rview)
161 104 break
162 105
163 106 class branchcache(dict):
164 107 """A dict like object that hold branches heads cache.
165 108
166 109 This cache is used to avoid costly computations to determine all the
167 110 branch heads of a repo.
168 111
169 112 The cache is serialized on disk in the following format:
170 113
171 114 <tip hex node> <tip rev number> [optional filtered repo hex hash]
172 115 <branch head hex node> <open/closed state> <branch name>
173 116 <branch head hex node> <open/closed state> <branch name>
174 117 ...
175 118
176 119 The first line is used to check if the cache is still valid. If the
177 120 branch cache is for a filtered repo view, an optional third hash is
178 121 included that hashes the hashes of all filtered revisions.
179 122
180 123 The open/closed state is represented by a single letter 'o' or 'c'.
181 124 This field can be used to avoid changelog reads when determining if a
182 125 branch head closes a branch or not.
183 126 """
127 @classmethod
128 def fromfile(cls, repo):
129 f = None
130 try:
131 f = repo.cachevfs(cls._filename(repo))
132 lineiter = iter(f)
133 cachekey = next(lineiter).rstrip('\n').split(" ", 2)
134 last, lrev = cachekey[:2]
135 last, lrev = bin(last), int(lrev)
136 filteredhash = None
137 if len(cachekey) > 2:
138 filteredhash = bin(cachekey[2])
139 bcache = cls(tipnode=last, tiprev=lrev, filteredhash=filteredhash)
140 if not bcache.validfor(repo):
141 # invalidate the cache
142 raise ValueError(r'tip differs')
143 cl = repo.changelog
144 for line in lineiter:
145 line = line.rstrip('\n')
146 if not line:
147 continue
148 node, state, label = line.split(" ", 2)
149 if state not in 'oc':
150 raise ValueError(r'invalid branch state')
151 label = encoding.tolocal(label.strip())
152 node = bin(node)
153 if not cl.hasnode(node):
154 raise ValueError(
155 r'node %s does not exist' % pycompat.sysstr(hex(node)))
156 bcache.setdefault(label, []).append(node)
157 if state == 'c':
158 bcache._closednodes.add(node)
159
160 except (IOError, OSError):
161 return None
162
163 except Exception as inst:
164 if repo.ui.debugflag:
165 msg = 'invalid branchheads cache'
166 if repo.filtername is not None:
167 msg += ' (%s)' % repo.filtername
168 msg += ': %s\n'
169 repo.ui.debug(msg % pycompat.bytestr(inst))
170 bcache = None
171
172 finally:
173 if f:
174 f.close()
175
176 return bcache
177
178 @staticmethod
179 def _filename(repo):
180 """name of a branchcache file for a given repo or repoview"""
181 filename = "branch2"
182 if repo.filtername:
183 filename = '%s-%s' % (filename, repo.filtername)
184 return filename
184 185
185 186 def __init__(self, entries=(), tipnode=nullid, tiprev=nullrev,
186 187 filteredhash=None, closednodes=None):
187 188 super(branchcache, self).__init__(entries)
188 189 self.tipnode = tipnode
189 190 self.tiprev = tiprev
190 191 self.filteredhash = filteredhash
191 192 # closednodes is a set of nodes that close their branch. If the branch
192 193 # cache has been updated, it may contain nodes that are no longer
193 194 # heads.
194 195 if closednodes is None:
195 196 self._closednodes = set()
196 197 else:
197 198 self._closednodes = closednodes
198 199
199 200 def validfor(self, repo):
200 201 """Is the cache content valid regarding a repo
201 202
202 203 - False when cached tipnode is unknown or if we detect a strip.
203 204 - True when cache is up to date or a subset of current repo."""
204 205 try:
205 206 return ((self.tipnode == repo.changelog.node(self.tiprev))
206 207 and (self.filteredhash == \
207 208 scmutil.filteredhash(repo, self.tiprev)))
208 209 except IndexError:
209 210 return False
210 211
211 212 def _branchtip(self, heads):
212 213 '''Return tuple with last open head in heads and false,
213 214 otherwise return last closed head and true.'''
214 215 tip = heads[-1]
215 216 closed = True
216 217 for h in reversed(heads):
217 218 if h not in self._closednodes:
218 219 tip = h
219 220 closed = False
220 221 break
221 222 return tip, closed
222 223
223 224 def branchtip(self, branch):
224 225 '''Return the tipmost open head on branch, otherwise return the
225 226 tipmost closed head on branch.
226 227 Raise KeyError for unknown branch.'''
227 228 return self._branchtip(self[branch])[0]
228 229
229 230 def iteropen(self, nodes):
230 231 return (n for n in nodes if n not in self._closednodes)
231 232
232 233 def branchheads(self, branch, closed=False):
233 234 heads = self[branch]
234 235 if not closed:
235 236 heads = list(self.iteropen(heads))
236 237 return heads
237 238
238 239 def iterbranches(self):
239 240 for bn, heads in self.iteritems():
240 241 yield (bn, heads) + self._branchtip(heads)
241 242
242 243 def copy(self):
243 244 """return an deep copy of the branchcache object"""
244 245 return branchcache(self, self.tipnode, self.tiprev, self.filteredhash,
245 246 self._closednodes)
246 247
247 248 def write(self, repo):
248 249 try:
249 f = repo.cachevfs(_filename(repo), "w", atomictemp=True)
250 f = repo.cachevfs(self._filename(repo), "w", atomictemp=True)
250 251 cachekey = [hex(self.tipnode), '%d' % self.tiprev]
251 252 if self.filteredhash is not None:
252 253 cachekey.append(hex(self.filteredhash))
253 254 f.write(" ".join(cachekey) + '\n')
254 255 nodecount = 0
255 256 for label, nodes in sorted(self.iteritems()):
256 257 for node in nodes:
257 258 nodecount += 1
258 259 if node in self._closednodes:
259 260 state = 'c'
260 261 else:
261 262 state = 'o'
262 263 f.write("%s %s %s\n" % (hex(node), state,
263 264 encoding.fromlocal(label)))
264 265 f.close()
265 266 repo.ui.log('branchcache',
266 267 'wrote %s branch cache with %d labels and %d nodes\n',
267 268 repo.filtername, len(self), nodecount)
268 269 except (IOError, OSError, error.Abort) as inst:
269 270 # Abort may be raised by read only opener, so log and continue
270 271 repo.ui.debug("couldn't write branch cache: %s\n" %
271 272 stringutil.forcebytestr(inst))
272 273
273 274 def update(self, repo, revgen):
274 275 """Given a branchhead cache, self, that may have extra nodes or be
275 276 missing heads, and a generator of nodes that are strictly a superset of
276 277 heads missing, this function updates self to be correct.
277 278 """
278 279 starttime = util.timer()
279 280 cl = repo.changelog
280 281 # collect new branch entries
281 282 newbranches = {}
282 283 getbranchinfo = repo.revbranchcache().branchinfo
283 284 for r in revgen:
284 285 branch, closesbranch = getbranchinfo(r)
285 286 newbranches.setdefault(branch, []).append(r)
286 287 if closesbranch:
287 288 self._closednodes.add(cl.node(r))
288 289
289 290 # fetch current topological heads to speed up filtering
290 291 topoheads = set(cl.headrevs())
291 292
292 293 # if older branchheads are reachable from new ones, they aren't
293 294 # really branchheads. Note checking parents is insufficient:
294 295 # 1 (branch a) -> 2 (branch b) -> 3 (branch a)
295 296 for branch, newheadrevs in newbranches.iteritems():
296 297 bheads = self.setdefault(branch, [])
297 298 bheadset = set(cl.rev(node) for node in bheads)
298 299
299 300 # This has been tested True on all internal usages of this function.
300 301 # Run it again in case of doubt:
301 302 # assert not (set(bheadrevs) & set(newheadrevs))
302 303 bheadset.update(newheadrevs)
303 304
304 305 # This prunes out two kinds of heads - heads that are superseded by
305 306 # a head in newheadrevs, and newheadrevs that are not heads because
306 307 # an existing head is their descendant.
307 308 uncertain = bheadset - topoheads
308 309 if uncertain:
309 310 floorrev = min(uncertain)
310 311 ancestors = set(cl.ancestors(newheadrevs, floorrev))
311 312 bheadset -= ancestors
312 313 bheadrevs = sorted(bheadset)
313 314 self[branch] = [cl.node(rev) for rev in bheadrevs]
314 315 tiprev = bheadrevs[-1]
315 316 if tiprev > self.tiprev:
316 317 self.tipnode = cl.node(tiprev)
317 318 self.tiprev = tiprev
318 319
319 320 if not self.validfor(repo):
320 321 # cache key is not valid anymore
321 322 self.tipnode = nullid
322 323 self.tiprev = nullrev
323 324 for heads in self.values():
324 325 tiprev = max(cl.rev(node) for node in heads)
325 326 if tiprev > self.tiprev:
326 327 self.tipnode = cl.node(tiprev)
327 328 self.tiprev = tiprev
328 329 self.filteredhash = scmutil.filteredhash(repo, self.tiprev)
329 330
330 331 duration = util.timer() - starttime
331 332 repo.ui.log('branchcache', 'updated %s branch cache in %.4f seconds\n',
332 333 repo.filtername, duration)
333 334
334 335 # Revision branch info cache
335 336
336 337 _rbcversion = '-v1'
337 338 _rbcnames = 'rbc-names' + _rbcversion
338 339 _rbcrevs = 'rbc-revs' + _rbcversion
339 340 # [4 byte hash prefix][4 byte branch name number with sign bit indicating open]
340 341 _rbcrecfmt = '>4sI'
341 342 _rbcrecsize = calcsize(_rbcrecfmt)
342 343 _rbcnodelen = 4
343 344 _rbcbranchidxmask = 0x7fffffff
344 345 _rbccloseflag = 0x80000000
345 346
class revbranchcache(object):
    """Persistent cache, mapping from revision number to branch name and
    close flag. This is a low level cache, independent of filtering.

    Branch names are stored in rbc-names in internal encoding separated by 0.
    rbc-names is append-only, and each branch name is only stored once and will
    thus have a unique index.

    The branch info for each revision is stored in rbc-revs as constant size
    records. The whole file is read into memory, but it is only 'parsed' on
    demand. The file is usually append-only but will be truncated if repo
    modification is detected.
    The record for each revision contains the first 4 bytes of the
    corresponding node hash, and the record is only used if it still matches.
    Even a completely trashed rbc-revs will thus still give the right result
    while converging towards full recovery ... assuming no incorrectly matching
    node hashes.
    The record also contains 4 bytes where 31 bits contain the index of the
    branch and the last bit indicates that it is a branch close commit.
    The usage pattern for rbc-revs is thus somewhat similar to 00changelog.i
    and will grow with it but be 1/8th of its size.
    """

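    # Editor's sketch of the on-disk layout described above (hypothetical
    # contents, not part of branchmap.py):
    #
    #   rbc-names-v1: b'default\x00stable\x00feature-x'
    #   rbc-revs-v1:  one '>4sI' record per revision; a rev on 'stable'
    #                 (index 1, open) stores node[:4] + b'\x00\x00\x00\x01'
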
    def __init__(self, repo, readonly=True):
        assert repo.filtername is None
        self._repo = repo
        self._names = []  # branch names in local encoding with static index
        self._rbcrevs = bytearray()
        self._rbcsnameslen = 0  # length of names data read from rbc-names
        try:
            bndata = repo.cachevfs.read(_rbcnames)
            self._rbcsnameslen = len(bndata)  # for verification before writing
            if bndata:
                self._names = [encoding.tolocal(bn)
                               for bn in bndata.split('\0')]
        except (IOError, OSError):
            if readonly:
                # don't try to use cache - fall back to the slow path
                self.branchinfo = self._branchinfo

        if self._names:
            try:
                data = repo.cachevfs.read(_rbcrevs)
                self._rbcrevs[:] = data
            except (IOError, OSError) as inst:
                repo.ui.debug("couldn't read revision branch cache: %s\n" %
                              stringutil.forcebytestr(inst))
        # remember number of good records on disk
        self._rbcrevslen = min(len(self._rbcrevs) // _rbcrecsize,
                               len(repo.changelog))
        if self._rbcrevslen == 0:
            self._names = []
        self._rbcnamescount = len(self._names)  # number of names read at
                                                # _rbcsnameslen

    def _clear(self):
        self._rbcsnameslen = 0
        del self._names[:]
        self._rbcnamescount = 0
        self._rbcrevslen = len(self._repo.changelog)
        self._rbcrevs = bytearray(self._rbcrevslen * _rbcrecsize)
        util.clearcachedproperty(self, '_namesreverse')

    @util.propertycache
    def _namesreverse(self):
        return dict((b, r) for r, b in enumerate(self._names))

    def branchinfo(self, rev):
        """Return branch name and close flag for rev, using and updating
        persistent cache."""
        changelog = self._repo.changelog
        rbcrevidx = rev * _rbcrecsize

        # avoid negative index, changelog.read(nullrev) is fast without cache
        if rev == nullrev:
            return changelog.branchinfo(rev)

        # if requested rev isn't allocated, grow and cache the rev info
        if len(self._rbcrevs) < rbcrevidx + _rbcrecsize:
            return self._branchinfo(rev)

        # fast path: extract data from cache, use it if node is matching
        reponode = changelog.node(rev)[:_rbcnodelen]
        cachenode, branchidx = unpack_from(
            _rbcrecfmt, util.buffer(self._rbcrevs), rbcrevidx)
        close = bool(branchidx & _rbccloseflag)
        if close:
            branchidx &= _rbcbranchidxmask
        if cachenode == '\0\0\0\0':
            pass
        elif cachenode == reponode:
            try:
                return self._names[branchidx], close
            except IndexError:
                # recover from invalid reference to unknown branch
                self._repo.ui.debug("referenced branch names not found"
                                    " - rebuilding revision branch cache"
                                    " from scratch\n")
                self._clear()
        else:
            # rev/node map has changed, invalidate the cache from here up
            self._repo.ui.debug("history modification detected - truncating "
                                "revision branch cache to revision %d\n" % rev)
            truncate = rbcrevidx + _rbcrecsize
            del self._rbcrevs[truncate:]
            self._rbcrevslen = min(self._rbcrevslen, truncate)

        # fall back to slow path and make sure it will be written to disk
        return self._branchinfo(rev)

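    # Editor's note on the fast path above: a record is trusted only when its
    # stored 4-byte prefix matches changelog.node(rev)[:_rbcnodelen], so a
    # stale or corrupt rbc-revs file degrades to the slow path below instead
    # of returning a wrong branch name.
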
    def _branchinfo(self, rev):
        """Retrieve branch info from changelog and update _rbcrevs"""
        changelog = self._repo.changelog
        b, close = changelog.branchinfo(rev)
        if b in self._namesreverse:
            branchidx = self._namesreverse[b]
        else:
            branchidx = len(self._names)
            self._names.append(b)
            self._namesreverse[b] = branchidx
        reponode = changelog.node(rev)
        if close:
            branchidx |= _rbccloseflag
        self._setcachedata(rev, reponode, branchidx)
        return b, close

    def setdata(self, branch, rev, node, close):
        """add new data information to the cache"""
        if branch in self._namesreverse:
            branchidx = self._namesreverse[branch]
        else:
            branchidx = len(self._names)
            self._names.append(branch)
            self._namesreverse[branch] = branchidx
        if close:
            branchidx |= _rbccloseflag
        self._setcachedata(rev, node, branchidx)
        # If no cache data were readable (file missing, bad permissions,
        # etc.), the cache was bypassing itself by setting:
        #
        #   self.branchinfo = self._branchinfo
        #
        # Since we now have data in the cache, we need to drop this bypass.
        if r'branchinfo' in vars(self):
            del self.branchinfo

    def _setcachedata(self, rev, node, branchidx):
        """Writes the node's branch data to the in-memory cache data."""
        if rev == nullrev:
            return
        rbcrevidx = rev * _rbcrecsize
        if len(self._rbcrevs) < rbcrevidx + _rbcrecsize:
            self._rbcrevs.extend('\0' *
                                 (len(self._repo.changelog) * _rbcrecsize -
                                  len(self._rbcrevs)))
        pack_into(_rbcrecfmt, self._rbcrevs, rbcrevidx, node, branchidx)
        self._rbcrevslen = min(self._rbcrevslen, rev)

        tr = self._repo.currenttransaction()
        if tr:
            tr.addfinalize('write-revbranchcache', self.write)

    def write(self, tr=None):
        """Save branch cache if it is dirty."""
        repo = self._repo
        wlock = None
        step = ''
        try:
            if self._rbcnamescount < len(self._names):
                step = ' names'
                wlock = repo.wlock(wait=False)
                if self._rbcnamescount != 0:
                    f = repo.cachevfs.open(_rbcnames, 'ab')
                    if f.tell() == self._rbcsnameslen:
                        f.write('\0')
                    else:
                        f.close()
                        repo.ui.debug("%s changed - rewriting it\n" % _rbcnames)
                        self._rbcnamescount = 0
                        self._rbcrevslen = 0
                if self._rbcnamescount == 0:
                    # before rewriting names, make sure references are removed
                    repo.cachevfs.unlinkpath(_rbcrevs, ignoremissing=True)
                    f = repo.cachevfs.open(_rbcnames, 'wb')
                f.write('\0'.join(encoding.fromlocal(b)
                                  for b in self._names[self._rbcnamescount:]))
                self._rbcsnameslen = f.tell()
                f.close()
                self._rbcnamescount = len(self._names)

            start = self._rbcrevslen * _rbcrecsize
            if start != len(self._rbcrevs):
                step = ''
                if wlock is None:
                    wlock = repo.wlock(wait=False)
                revs = min(len(repo.changelog),
                           len(self._rbcrevs) // _rbcrecsize)
                f = repo.cachevfs.open(_rbcrevs, 'ab')
                if f.tell() != start:
                    repo.ui.debug("truncating cache/%s to %d\n"
                                  % (_rbcrevs, start))
                    f.seek(start)
                    if f.tell() != start:
                        start = 0
                        f.seek(start)
                    f.truncate()
                end = revs * _rbcrecsize
                f.write(self._rbcrevs[start:end])
                f.close()
                self._rbcrevslen = revs
        except (IOError, OSError, error.Abort, error.LockError) as inst:
            repo.ui.debug("couldn't write revision branch cache%s: %s\n"
                          % (step, stringutil.forcebytestr(inst)))
        finally:
            if wlock is not None:
                wlock.release()
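
# Editor's sketch (not part of branchmap.py) of typical use. `hg.repository`
# and `ui.load` are real Mercurial APIs of this era; the function itself and
# `repopath` are hypothetical, and the repo is assumed to be non-empty.
def _demo_branchinfo(repopath):
    from mercurial import hg, ui as uimod
    repo = hg.repository(uimod.ui.load(), repopath).unfiltered()
    rbc = revbranchcache(repo, readonly=False)
    # look up the branch of the tip revision via the persistent cache
    branch, closed = rbc.branchinfo(len(repo.changelog) - 1)
    rbc.write()  # persist any records the lookup added
    return branch, closed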