upstream/mercurial-mirror Commit - r30370:10c92459

manifest: move clearcaches to manifestlog...

Durham Goode -

r30370:10c92459 default

parent child

contrib/perf.py

0 +1 -1

              # perf.py - performance test routines
              '''helper extension to measure performance'''
              # "historical portability" policy of perf.py:
              #
              # We have to do:
              # - make perf.py "loadable" with as wide Mercurial version as possible
              #   This doesn't mean that perf commands work correctly with that Mercurial.
              #   BTW, perf.py itself has been available since 1.1 (or eb240755386d).
              # - make historical perf command work correctly with as wide Mercurial
              #   version as possible
              #
              # We have to do, if possible with reasonable cost:
              # - make recent perf command for historical feature work correctly
              #   with early Mercurial
              #
              # We don't have to do:
              # - make perf command for recent feature work correctly with early
              #   Mercurial
              from __future__ import absolute_import
              import functools
              import os
              import random
              import sys
              import time
              from mercurial import (
                  bdiff,
                  changegroup,
                  cmdutil,
                  commands,
                  copies,
                  error,
                  extensions,
                  mdiff,
                  merge,
                  revlog,
                  util,
              )
              # for "historical portability":
              # try to import modules separately (in dict order), and ignore
              # failure, because these aren't available with early Mercurial
              try:
                  from mercurial import branchmap # since 2.5 (or bcee63733aad)
              except ImportError:
                  pass
              try:
                  from mercurial import obsolete # since 2.3 (or ad0d6c2b3279)
              except ImportError:
                  pass
              try:
                  from mercurial import repoview # since 2.5 (or 3a6ddacb7198)
              except ImportError:
                  pass
              try:
                  from mercurial import scmutil # since 1.9 (or 8b252e826c68)
              except ImportError:
                  pass
              # for "historical portability":
              # define util.safehasattr forcibly, because util.safehasattr has been
              # available since 1.9.3 (or 94b200a11cf7)
              _undefined = object()
              def safehasattr(thing, attr):
                  """Tell whether 'thing' has an attribute named 'attr'
                  A private sentinel object is used as the getattr() default, so an
                  attribute whose value is None (or any other false value) still
                  counts as present.
                  """
                  found = getattr(thing, attr, _undefined)
                  return found is not _undefined
              setattr(util, 'safehasattr', safehasattr)
              # for "historical portability":
              # use locally defined empty option list, if formatteropts isn't
              # available, because commands.formatteropts has been available since
              # 3.2 (or 7a7eed5176a4), even though formatting itself has been
              # available since 2.2 (or ae5f92e154d3)
              formatteropts = getattr(commands, "formatteropts", [])
              # for "historical portability":
              # use locally defined option list, if debugrevlogopts isn't available,
              # because commands.debugrevlogopts has been available since 3.7 (or
              # 5606f7d0d063), even though cmdutil.openrevlog() has been available
              # since 1.9 (or a79fea6b3e77).
              revlogopts = getattr(commands, "debugrevlogopts", [
                      ('c', 'changelog', False, ('open changelog')),
                      ('m', 'manifest', False, ('open manifest')),
                      ('', 'dir', False, ('open directory manifest')),
                      ])
              # table of the perf commands defined in this file; it is handed to
              # cmdutil.command(), or filled directly by the local "command"
              # decorator when cmdutil.command isn't available
              cmdtable = {}
              # for "historical portability":
              # define parsealiases locally, because cmdutil.parsealiases has been
              # available since 1.5 (or 6252852b4332)
              def parsealiases(cmd):
                  """Return the list of names declared by command spec 'cmd'
                  Leading "^" characters are dropped, and the remainder is split
                  at each "|".
                  """
                  names = cmd.lstrip("^")
                  return names.split("|")
              if not safehasattr(cmdutil, 'command'):
                  # for "historical portability":
                  # define "@command" annotation locally, because cmdutil.command
                  # has been available since 1.9 (or 2daa5179e73f)
                  def command(name, options=(), synopsis=None, norepo=False):
                      def decorator(func):
                          # the synopsis is appended to the entry only when it is given
                          entry = (func, list(options))
                          if synopsis:
                              entry += (synopsis,)
                          cmdtable[name] = entry
                          if norepo:
                              aliases = ' '.join(parsealiases(name))
                              commands.norepo += ' %s' % aliases
                          return func
                      return decorator
              else:
                  import inspect
                  command = cmdutil.command(cmdtable)
                  if 'norepo' not in inspect.getargspec(command)[0]:
                      # for "historical portability":
                      # wrap original cmdutil.command, because "norepo" option has
                      # been available since 3.1 (or 75a96326cecb)
                      _command = command
                      def command(name, options=(), synopsis=None, norepo=False):
                          if norepo:
                              aliases = ' '.join(parsealiases(name))
                              commands.norepo += ' %s' % aliases
                          return _command(name, list(options), synopsis)
              def getlen(ui):
                  """Return the function used to measure lengths
                  When the "perf.stub" config is true, a stub that always
                  returns 1 is returned; otherwise the builtin len() is returned.
                  """
                  if not ui.configbool("perf", "stub"):
                      return len
                  return lambda x: 1
              def gettimer(ui, opts=None):
                  """Build the (timer, formatter) pair used by the perf commands
                  Creation of the formatter is gathered here, instead of being
                  duplicated in every performance command. The returned timer is
                  stub_timer or _timer, already bound to the returned formatter."""
                  # experimental config: perf.presleep
                  # stay idle for a while before measuring, to counteract power
                  # management
                  presleep = getint(ui, "perf", "presleep", 1)
                  time.sleep(presleep)
                  if opts is None:
                      opts = {}
                  # work on a copy of ui, whose regular output goes to stderr
                  ui = ui.copy()
                  foutsetter = safeattrsetter(ui, 'fout', ignoremissing=True)
                  if foutsetter:
                      # for "historical portability":
                      # ui.fout/ferr have been available since 1.9 (or 4e1ccd4c2b6d)
                      foutsetter.set(ui.ferr)
                  # pick up the formatter factory of ui, if there is one
                  makeformatter = getattr(ui, 'formatter', None)
                  if makeformatter:
                      fm = makeformatter('perf', opts)
                  else:
                      # for "historical portability":
                      # define formatter locally, because ui.formatter has been
                      # available since 2.2 (or ae5f92e154d3)
                      from mercurial import node
                      class defaultformatter(object):
                          """Minimized composition of baseformatter and plainformatter
                          """
                          def __init__(self, ui, topic, opts):
                              self._ui = ui
                              self.hexfunc = node.short
                              if ui.debugflag:
                                  self.hexfunc = node.hex
                          def __nonzero__(self):
                              return False
                          def startitem(self):
                              pass
                          def data(self, **data):
                              pass
                          def write(self, fields, deftext, *fielddata, **opts):
                              self._ui.write(deftext % fielddata, **opts)
                          def condwrite(self, cond, fields, deftext, *fielddata, **opts):
                              if not cond:
                                  return
                              self._ui.write(deftext % fielddata, **opts)
                          def plain(self, text, **opts):
                              self._ui.write(text, **opts)
                          def end(self):
                              pass
                      fm = defaultformatter(ui, 'perf', opts)
                  # experimental config: perf.stub
                  # the stub timer runs code only once instead of in a loop
                  timerfunc = _timer
                  if ui.configbool("perf", "stub"):
                      timerfunc = stub_timer
                  return functools.partial(timerfunc, fm), fm
              def stub_timer(fm, func, title=None):
                  """Run 'func' exactly once, without measuring or reporting
                  'fm' and 'title' are accepted, so that this function can be
                  called the same way as _timer(), but they are ignored.
                  """
                  func()
              def _timer(fm, func, title=None):
                  """Run 'func' repeatedly, and report the best run through 'fm'
                  Looping stops once more than 3 seconds have passed with at least
                  100 runs, or more than 10 seconds with at least 3 runs. The
                  smallest (wall, user, sys) sample is reported, together with the
                  number of runs. The result of the last run is reported too, if
                  it is true.
                  """
                  samples = []
                  started = time.time()
                  runs = 0
                  while True:
                      cpubefore = os.times()
                      wallbefore = time.time()
                      r = func()
                      wallafter = time.time()
                      cpuafter = os.times()
                      runs += 1
                      samples.append((wallafter - wallbefore,
                                      cpuafter[0] - cpubefore[0],
                                      cpuafter[1] - cpubefore[1]))
                      elapsed = wallafter - started
                      if (elapsed > 3 and runs >= 100) or (elapsed > 10 and runs >= 3):
                          break
                  fm.startitem()
                  if title:
                      fm.write('title', '! %s\n', title)
                  if r:
                      fm.write('result', '! result: %s\n', r)
                  # tuples compare element-wise, so this picks the smallest wall time
                  wall, user, system = min(samples)
                  fm.plain('!')
                  fm.write('wall', ' wall %f', wall)
                  fm.write('comb', ' comb %f', user + system)
                  fm.write('user', ' user %f', user)
                  fm.write('sys',  ' sys %f', system)
                  fm.write('count',  ' (best of %d)', runs)
                  fm.plain('\n')
              # utilities for historical portability
              def getint(ui, section, name, default):
                  """Return config value 'section.name' as an integer
                  'default' is returned as is, if the config isn't set.
                  error.ConfigError is raised, if the value isn't an integer.
                  """
                  # for "historical portability":
                  # ui.configint has been available since 1.9 (or fa2b596db182)
                  raw = ui.config(section, name, None)
                  if raw is not None:
                      try:
                          return int(raw)
                      except ValueError:
                          raise error.ConfigError(("%s.%s is not an integer ('%s')")
                                                  % (section, name, raw))
                  return default
              def safeattrsetter(obj, name, ignoremissing=False):
                  """Return a helper to replace and restore attribute 'name' of 'obj'
                  The returned object has set(newvalue), which assigns a new value
                  to the attribute, and restore(), which puts back the value the
                  attribute had when this function was called.
                  If 'obj' doesn't have 'name' attribute, error.Abort is raised,
                  in order to avoid overlooking removal of an attribute, which
                  breaks assumption of performance measurement, in the future.
                  If 'ignoremissing' is true, None is returned in such case
                  instead. This is useful to examine an attribute, which isn't
                  ensured in all Mercurial versions.
                  """
                  if util.safehasattr(obj, name):
                      saved = getattr(obj, name)
                      class attrutil(object):
                          def set(self, newvalue):
                              setattr(obj, name, newvalue)
                          def restore(self):
                              setattr(obj, name, saved)
                      return attrutil()
                  if ignoremissing:
                      return None
                  raise error.Abort(("missing attribute %s of %s might break assumption"
                                     " of performance measurement") % (name, obj))
              # utilities to examine each internal API changes
              def getbranchmapsubsettable():
                  """Return the 'subsettable' mapping of this Mercurial
                  error.Abort is raised, if neither branchmap nor repoview module
                  provides it.
                  """
                  # for "historical portability":
                  # subsettable is defined in:
                  # - branchmap since 2.9 (or 175c6fd8cacc)
                  # - repoview since 2.5 (or 59a9f18d4587)
                  #
                  # modules are looked up by name, because importing them at the
                  # top of this file is allowed to fail, and referring to a missing
                  # name directly would raise NameError instead of the abort below
                  for modname in ('branchmap', 'repoview'):
                      mod = globals().get(modname)
                      subsettable = getattr(mod, 'subsettable', None)
                      if subsettable:
                          return subsettable
                  # bisecting in bcee63733aad::59a9f18d4587 can reach here (both
                  # branchmap and repoview modules exist, but subsettable attribute
                  # doesn't)
                  raise error.Abort(("perfbranchmap not available with this Mercurial"),
                                    hint="use 2.5 or later")
              def getsvfs(repo):
                  """Return appropriate object to access files under .hg/store
                  repo.svfs is used if it is available and true, and repo.sopener
                  is used otherwise.
                  """
                  # for "historical portability":
                  # repo.svfs has been available since 2.3 (or 7034365089bf)
                  store = getattr(repo, 'svfs', None)
                  if not store:
                      store = repo.sopener
                  return store
              def getvfs(repo):
                  """Return appropriate object to access files under .hg
                  repo.vfs is used if it is available and true, and repo.opener
                  is used otherwise.
                  """
                  # for "historical portability":
                  # repo.vfs has been available since 2.3 (or 7034365089bf)
                  dothg = getattr(repo, 'vfs', None)
                  if not dothg:
                      dothg = repo.opener
                  return dothg
              def repocleartagscachefunc(repo):
                  """Return the function to clear tags cache according to repo internal API
                  The attributes '_tagscache', '_tags' and 'tagscache' of 'repo'
                  are examined in this order, and error.Abort is raised if none of
                  them is available.
                  """
                  if util.safehasattr(repo, '_tagscache'): # since 2.0 (or 9dca7653b525)
                      # in this case, setattr(repo, '_tagscache', None) or so isn't
                      # correct way to clear tags cache, because existing code paths
                      # expect _tagscache to be a structured object.
                      def clearcache():
                          # _tagscache has been filteredpropertycache since 2.5 (or
                          # 98c867ac1330), and delattr() can't work in such case
                          vars(repo).pop('_tagscache', None)
                      return clearcache
                  # - '_tags' since 1.4 (or 5614a628d173)
                  # - 'tagscache' since 0.6 (or d7df759d0e97)
                  for attr in ('_tags', 'tagscache'):
                      setter = safeattrsetter(repo, attr, ignoremissing=True)
                      if setter:
                          return lambda : setter.set(None)
                  # Mercurial earlier than 0.6 (or d7df759d0e97) logically reaches
                  # this point, but it isn't so problematic, because:
                  # - repo.tags of such Mercurial isn't "callable", and repo.tags()
                  #   in perftags() causes failure soon
                  # - perf.py itself has been available since 1.1 (or eb240755386d)
                  raise error.Abort(("tags API of this hg command is unknown"))
              # perf commands
              @command('perfwalk', formatteropts)
              def perfwalk(ui, repo, *pats, **opts):
                  # time walking the working directory for the files matching 'pats'
                  #
                  # dirstate.walk() is tried first; whenever an attempt raises,
                  # dirstate.statwalk() and then cmdutil.walk() are tried instead
                  # (presumably the walk APIs of older Mercurial)
                  timer, fm = gettimer(ui, opts)
                  try:
                      matcher = scmutil.match(repo[None], pats, {})
                      def walk():
                          return len(list(repo.dirstate.walk(matcher, [], True, False)))
                      timer(walk)
                  except Exception:
                      try:
                          matcher = scmutil.match(repo[None], pats, {})
                          def statwalk():
                              return len([b for a, b, c
                                          in repo.dirstate.statwalk([], matcher)])
                          timer(statwalk)
                      except Exception:
                          def cmdwalk():
                              return len(list(cmdutil.walk(repo, pats, {})))
                          timer(cmdwalk)
                  fm.end()
              @command('perfannotate', formatteropts)
              def perfannotate(ui, repo, f, **opts):
                  # time annotating file 'f' as found in revision '.'
                  timer, fm = gettimer(ui, opts)
                  fctx = repo['.'][f]
                  def annotate():
                      return len(fctx.annotate(True))
                  timer(annotate)
                  fm.end()
              @command('perfstatus',
                       [('u', 'unknown', False,
                         'ask status to look for unknown files')] + formatteropts)
              def perfstatus(ui, repo, **opts):
                  # time repo.status(), and report the total number of listed files
                  #m = match.always(repo.root, repo.getcwd())
                  #timer(lambda: sum(map(len, repo.dirstate.status(m, [], False, False,
                  #                                                False))))
                  timer, fm = gettimer(ui, opts)
                  def status():
                      st = repo.status(unknown=opts['unknown'])
                      return sum(len(files) for files in st)
                  timer(status)
                  fm.end()
              @command('perfaddremove', formatteropts)
              def perfaddremove(ui, repo, **opts):
                  # time a dry-run of addremove, with repo.ui silenced meanwhile
                  timer, fm = gettimer(ui, opts)
                  # remember the flag before entering the try block, so that the
                  # finally clause can never refer to an unbound 'oldquiet' and hide
                  # the original error
                  oldquiet = repo.ui.quiet
                  try:
                      repo.ui.quiet = True
                      matcher = scmutil.match(repo[None])
                      timer(lambda: scmutil.addremove(repo, matcher, "", dry_run=True))
                  finally:
                      # always restore the flag and close the formatter
                      repo.ui.quiet = oldquiet
                      fm.end()
              def clearcaches(cl):
                  """Clear the caches of 'cl'
                  cl.clearcaches() is used if it is available. Otherwise, if 'cl'
                  has '_nodecache', the node cache is reset to hold only the null
                  revision, and '_nodepos' is reset to None. Nothing is done for
                  any other object.
                  """
                  # behave somewhat consistently across internal API changes
                  if util.safehasattr(cl, 'clearcaches'):
                      cl.clearcaches()
                      return
                  if not util.safehasattr(cl, '_nodecache'):
                      return
                  from mercurial.node import nullid, nullrev
                  cl._nodecache = {nullid: nullrev}
                  cl._nodepos = None
              @command('perfheads', formatteropts)
              def perfheads(ui, repo, **opts):
                  # time computing the head revisions of the changelog; caches of the
                  # changelog are cleared at the end of each run
                  timer, fm = gettimer(ui, opts)
                  clog = repo.changelog
                  def headrevs():
                      len(clog.headrevs())
                      clearcaches(clog)
                  timer(headrevs)
                  fm.end()
              @command('perftags', formatteropts)
              def perftags(ui, repo, **opts):
                  # time computing repo.tags(), and report the number of tags
                  import mercurial.changelog
                  import mercurial.manifest
                  timer, fm = gettimer(ui, opts)
                  store = getsvfs(repo)
                  cleartagscache = repocleartagscachefunc(repo)
                  def tags():
                      # every run starts from newly created changelog and manifestlog
                      # objects, and from a cleared tags cache
                      repo.changelog = mercurial.changelog.changelog(store)
                      repo.manifestlog = mercurial.manifest.manifestlog(store, repo)
                      cleartagscache()
                      return len(repo.tags())
                  timer(tags)
                  fm.end()
              @command('perfancestors', formatteropts)
              def perfancestors(ui, repo, **opts):
                  # time iterating over all ancestors of the changelog heads
                  timer, fm = gettimer(ui, opts)
                  heads = repo.changelog.headrevs()
                  def walkancestors():
                      # values are discarded; the iteration itself is what is timed
                      for _rev in repo.changelog.ancestors(heads):
                          pass
                  timer(walkancestors)
                  fm.end()
              @command('perfancestorset', formatteropts)
              def perfancestorset(ui, repo, revset, **opts):
                  # time membership tests of the revisions of 'revset' against the
                  # ancestors of the changelog heads
                  timer, fm = gettimer(ui, opts)
                  revs = repo.revs(revset)
                  heads = repo.changelog.headrevs()
                  def membership():
                      ancestors = repo.changelog.ancestors(heads)
                      for rev in revs:
                          # the result is discarded on purpose; only the test is timed
                          rev in ancestors
                  timer(membership)
                  fm.end()
              @command('perfchangegroupchangelog', formatteropts +
                       [('', 'version', '02', 'changegroup version'),
                        ('r', 'rev', '', 'revisions to add to changegroup')])
              def perfchangegroupchangelog(ui, repo, version='02', rev=None, **opts):
                  """Benchmark producing a changelog group for a changegroup.
                  This measures the time spent processing the changelog during a
                  bundle operation. This occurs during `hg bundle` and on a server
                  processing a `getbundle` wire protocol request (handles clones
                  and pull requests).
                  By default, all revisions are added to the changegroup.
                  """
                  clog = repo.changelog
                  nodes = [clog.lookup(r) for r in repo.revs(rev or 'all()')]
                  bundler = changegroup.getbundler(version, repo)
                  def lookup(node):
                      # The real bundler reads the revision in order to access the
                      # manifest node and files list. Do that here.
                      clog.read(node)
                      return node
                  def generate():
                      # chunks are discarded; only producing them is timed
                      for _chunk in bundler.group(nodes, clog, lookup):
                          pass
                  timer, fm = gettimer(ui, opts)
                  timer(generate)
                  fm.end()
              @command('perfdirs', formatteropts)
              def perfdirs(ui, repo, **opts):
                  # time dirstate.dirs(), dropping dirstate._dirs after each run
                  timer, fm = gettimer(ui, opts)
                  ds = repo.dirstate
                  # touch the dirstate once before timing (presumably to load it)
                  'a' in ds
                  def builddirs():
                      ds.dirs()
                      del ds._dirs
                  timer(builddirs)
                  fm.end()
              @command('perfdirstate', formatteropts)
              def perfdirstate(ui, repo, **opts):
                  # time a membership test on the dirstate right after invalidating it
                  timer, fm = gettimer(ui, opts)
                  # touch the dirstate once before timing
                  "a" in repo.dirstate
                  def reparse():
                      repo.dirstate.invalidate()
                      "a" in repo.dirstate
                  timer(reparse)
                  fm.end()
              @command('perfdirstatedirs', formatteropts)
              def perfdirstatedirs(ui, repo, **opts):
                  # time a membership test on dirstate._dirs, dropping it after each run
                  timer, fm = gettimer(ui, opts)
                  # touch the dirstate once before timing
                  "a" in repo.dirstate
                  def builddirs():
                      "a" in repo.dirstate._dirs
                      del repo.dirstate._dirs
                  timer(builddirs)
                  fm.end()
              @command('perfdirstatefoldmap', formatteropts)
              def perfdirstatefoldmap(ui, repo, **opts):
                  # time a lookup in dirstate._filefoldmap, dropping it after each run
                  timer, fm = gettimer(ui, opts)
                  ds = repo.dirstate
                  # touch the dirstate once before timing
                  'a' in ds
                  def buildfoldmap():
                      ds._filefoldmap.get('a')
                      del ds._filefoldmap
                  timer(buildfoldmap)
                  fm.end()
              @command('perfdirfoldmap', formatteropts)
              def perfdirfoldmap(ui, repo, **opts):
                  # time a lookup in dirstate._dirfoldmap; both _dirfoldmap and _dirs
                  # are dropped after each run
                  timer, fm = gettimer(ui, opts)
                  ds = repo.dirstate
                  # touch the dirstate once before timing
                  'a' in ds
                  def buildfoldmap():
                      ds._dirfoldmap.get('a')
                      del ds._dirfoldmap
                      del ds._dirs
                  timer(buildfoldmap)
                  fm.end()
              @command('perfdirstatewrite', formatteropts)
              def perfdirstatewrite(ui, repo, **opts):
                  # time writing the dirstate out
                  timer, fm = gettimer(ui, opts)
                  dirstate = repo.dirstate
                  # touch the dirstate once before timing
                  "a" in dirstate
                  def write():
                      # mark the dirstate dirty before every write
                      dirstate._dirty = True
                      dirstate.write(repo.currenttransaction())
                  timer(write)
                  fm.end()
              @command('perfmergecalculate',
                       [('r', 'rev', '.', 'rev to merge against')] + formatteropts)
              def perfmergecalculate(ui, repo, rev, **opts):
                  # time merge.calculateupdates() between the working directory and 'rev'
                  timer, fm = gettimer(ui, opts)
                  wctx = repo[None]
                  rctx = scmutil.revsingle(repo, rev, rev)
                  ancestor = wctx.ancestor(rctx)
                  # we don't want working dir files to be stat'd in the benchmark, so prime
                  # that cache
                  wctx.dirty()
                  def calculate():
                      # acceptremote is True because we don't want prompts in the middle of
                      # our benchmark
                      merge.calculateupdates(repo, wctx, rctx, [ancestor], False, False,
                                             acceptremote=True, followcopies=True)
                  timer(calculate)
                  fm.end()
              @command('perfpathcopies', [], "REV REV")
              def perfpathcopies(ui, repo, rev1, rev2, **opts):
                  # time copies.pathcopies() between revisions 'rev1' and 'rev2'
                  timer, fm = gettimer(ui, opts)
                  srcctx = scmutil.revsingle(repo, rev1, rev1)
                  dstctx = scmutil.revsingle(repo, rev2, rev2)
                  def pathcopies():
                      copies.pathcopies(srcctx, dstctx)
                  timer(pathcopies)
                  fm.end()
              @command('perfmanifest', [], 'REV')
              def perfmanifest(ui, repo, rev, **opts):
                  # time reading the manifest of revision 'rev'
                  timer, fm = gettimer(ui, opts)
                  ctx = scmutil.revsingle(repo, rev, rev)
                  # manifest node of the revision, resolved once outside the timed code
                  t = ctx.manifestnode()
                  def d():
                      # caches are cleared before every read (presumably so that each
                      # run reads the manifest without help of cached data)
-                     repo.manifest.clearcaches()
+                     repo.manifestlog.clearcaches()
                      repo.manifestlog[t].read()
                  timer(d)
                  fm.end()
              @command('perfchangeset', formatteropts)
              def perfchangeset(ui, repo, rev, **opts):
                  # time reading the changelog entry of revision 'rev'
                  timer, fm = gettimer(ui, opts)
                  node = repo[rev].node()
                  def readchangeset():
                      repo.changelog.read(node)
                      #repo.changelog._cache = None
                  timer(readchangeset)
                  fm.end()
              @command('perfindex', formatteropts)
              def perfindex(ui, repo, **opts):
                  # time opening "00changelog.i" as a revlog and looking up the
                  # revision number of the tip node in it
                  import mercurial.revlog
                  timer, fm = gettimer(ui, opts)
                  mercurial.revlog._prereadsize = 2**24 # disable lazy parser in old hg
                  tipnode = repo["tip"].node()
                  store = getsvfs(repo)
                  def openindex():
                      # a new revlog object is created on every run
                      clog = mercurial.revlog.revlog(store, "00changelog.i")
                      clog.rev(tipnode)
                  timer(openindex)
                  fm.end()
              @command('perfstartup', formatteropts)
              def perfstartup(ui, repo, **opts):
                  # time running "version -q" with the program named by sys.argv[0],
                  # with an empty HGRCPATH and output discarded
                  timer, fm = gettimer(ui, opts)
                  hgcmd = sys.argv[0]
                  def startup():
                      if os.name == 'nt':
                          # no inline "VAR= command" form is used here; the
                          # environment of this process is changed instead
                          os.environ['HGRCPATH'] = ''
                          os.system("%s version -q > NUL" % hgcmd)
                      else:
                          os.system("HGRCPATH= %s version -q > /dev/null" % hgcmd)
                  timer(startup)
                  fm.end()
              @command('perfparents', formatteropts)
              def perfparents(ui, repo, **opts):
                  # time looking up the parents of the first 'count' changelog nodes
                  timer, fm = gettimer(ui, opts)
                  # control the number of commits perfparents iterates over
                  # experimental config: perf.parentscount
                  count = getint(ui, "perf", "parentscount", 1000)
                  if len(repo.changelog) < count:
                      raise error.Abort("repo needs %d commits for this test" % count)
                  repo = repo.unfiltered()
                  # nodes are collected beforehand, so only parents() is timed
                  nodes = [repo.changelog.node(i) for i in xrange(count)]
                  def parents():
                      for node in nodes:
                          repo.changelog.parents(node)
                  timer(parents)
                  fm.end()
              @command('perfctxfiles', formatteropts)
              def perfctxfiles(ui, repo, x, **opts):
                  # time getting the files list of revision 'x' via its context object
                  x = int(x)
                  timer, fm = gettimer(ui, opts)
                  def ctxfiles():
                      ctx = repo[x]
                      len(ctx.files())
                  timer(ctxfiles)
                  fm.end()
              @command('perfrawfiles', formatteropts)
              def perfrawfiles(ui, repo, x, **opts):
                  # time reading changelog entry 'x', and taking item 3 of it
                  # (presumably the files list -- confirm against changelog.read())
                  x = int(x)
                  timer, fm = gettimer(ui, opts)
                  clog = repo.changelog
                  def rawfiles():
                      entry = clog.read(x)
                      len(entry[3])
                  timer(rawfiles)
                  fm.end()
              @command('perflookup', formatteropts)
              def perflookup(ui, repo, rev, **opts):
                  # time repo.lookup() of 'rev', and report the length of its result
                  timer, fm = gettimer(ui, opts)
                  def lookup():
                      return len(repo.lookup(rev))
                  timer(lookup)
                  fm.end()
              @command('perfrevrange', formatteropts)
              def perfrevrange(ui, repo, *specs, **opts):
                  # time resolving 'specs' with scmutil.revrange(), and report the
                  # number of resulting revisions
                  timer, fm = gettimer(ui, opts)
                  # looked up once here, so the attribute access isn't timed
                  revrange = scmutil.revrange
                  def resolve():
                      return len(revrange(repo, specs))
                  timer(resolve)
                  fm.end()
              @command('perfnodelookup', formatteropts)
              def perfnodelookup(ui, repo, rev, **opts):
                  # time looking up the revision number of the node of 'rev' in a
                  # revlog opened on "00changelog.i"
                  timer, fm = gettimer(ui, opts)
                  import mercurial.revlog
                  mercurial.revlog._prereadsize = 2**24 # disable lazy parser in old hg
                  node = repo[rev].node()
                  clog = mercurial.revlog.revlog(getsvfs(repo), "00changelog.i")
                  def nodelookup():
                      clog.rev(node)
                      # caches are cleared at the end of each run
                      clearcaches(clog)
                  timer(nodelookup)
                  fm.end()
              @command('perflog',
                       [('', 'rename', False, 'ask log to follow renames')] + formatteropts)
              def perflog(ui, repo, rev=None, **opts):
                  # time "hg log" for 'rev' (no revision restriction if it is omitted)
                  if rev is None:
                      rev = []
                  timer, fm = gettimer(ui, opts)
                  # output of log is captured in a buffer, and discarded
                  ui.pushbuffer()
                  try:
                      timer(lambda: commands.log(ui, repo, rev=rev, date='', user='',
                                                 copies=opts.get('rename')))
                  finally:
                      # pop the buffer even if log fails, so that later output of
                      # this ui isn't swallowed by a buffer left behind
                      ui.popbuffer()
                  fm.end()
              @command('perfmoonwalk', formatteropts)
              def perfmoonwalk(ui, repo, **opts):
                  """benchmark walking the changelog backwards
                  This also loads the changelog data for each revision in the changelog.
                  """
                  timer, fm = gettimer(ui, opts)
                  def moonwalk():
                      # valid revision numbers are 0 .. len(repo) - 1, so the walk
                      # has to start at len(repo) - 1; len(repo) itself is one past
                      # the last revision
                      for i in xrange(len(repo) - 1, -1, -1):
                          ctx = repo[i]
                          ctx.branch() # read changelog data (in addition to the index)
                  timer(moonwalk)
                  fm.end()
              @command('perftemplating', formatteropts)
              def perftemplating(ui, repo, rev=None, **opts):
                  # time "hg log" rendered through a fixed template
                  if rev is None:
                      rev = []
                  timer, fm = gettimer(ui, opts)
                  # output of log is captured in a buffer, and discarded
                  ui.pushbuffer()
                  try:
                      timer(lambda: commands.log(ui, repo, rev=rev, date='', user='',
                                                 template='{date|shortdate} [{rev}:{node|short}]'
                                                 ' {author|person}: {desc|firstline}\n'))
                  finally:
                      # pop the buffer even if log fails, so that later output of
                      # this ui isn't swallowed by a buffer left behind
                      ui.popbuffer()
                  fm.end()
              @command('perfcca', formatteropts)
              def perfcca(ui, repo, **opts):
                  # time creating a scmutil.casecollisionauditor on the dirstate
                  timer, fm = gettimer(ui, opts)
                  def audit():
                      # the new auditor is returned to the timer as the run's result
                      return scmutil.casecollisionauditor(ui, False, repo.dirstate)
                  timer(audit)
                  fm.end()
              @command('perffncacheload', formatteropts)
              def perffncacheload(ui, repo, **opts):
                  # time loading the fncache of the store
                  timer, fm = gettimer(ui, opts)
                  store = repo.store
                  def load():
                      store.fncache._load()
                  timer(load)
                  fm.end()
              @command('perffncachewrite', formatteropts)
              def perffncachewrite(ui, repo, **opts):
                  # Time writing the fncache within a transaction.
                  #
                  # The fncache is loaded once up front; every timed run marks it
                  # dirty again so that write() is called on a dirty cache each time.
                  timer, fm = gettimer(ui, opts)
                  s = repo.store
                  s.fncache._load()
                  lock = repo.lock()
                  try:
                      tr = repo.transaction('perffncachewrite')
                      try:
                          def d():
                              s.fncache._dirty = True
                              s.fncache.write(tr)
                          timer(d)
                          tr.close()
                      finally:
                          # release the transaction even if the benchmark raised,
                          # so it is not left open
                          tr.release()
                  finally:
                      # never leave the repository locked behind us
                      lock.release()
                  fm.end()
              @command('perffncacheencode', formatteropts)
              def perffncacheencode(ui, repo, **opts):
                  # Time store.encode() over every entry of the (pre-loaded) fncache.
                  timer, fm = gettimer(ui, opts)
                  store = repo.store
                  # load outside of the timed function
                  store.fncache._load()
                  def encodeall():
                      for path in store.fncache.entries:
                          store.encode(path)
                  timer(encodeall)
                  fm.end()
              @command('perfbdiff', revlogopts + formatteropts + [
                  ('', 'count', 1, 'number of revisions to test (when using --startrev)'),
                  ('', 'alldata', False, 'test bdiffs for all associated revisions')],
                  '-c|-m|FILE REV')
              def perfbdiff(ui, repo, file_, rev=None, count=None, **opts):
                  """benchmark a bdiff between revisions
                  By default, benchmark a bdiff between its delta parent and itself.
                  With ``--count``, benchmark bdiffs between delta parents and self for N
                  revisions starting at the specified revision.
                  With ``--alldata``, assume the requested revision is a changeset and
                  measure bdiffs for all changes related to that changeset (manifest
                  and filelogs).
                  """
                  if opts['alldata']:
                      opts['changelog'] = True
                  if opts.get('changelog') or opts.get('manifest'):
                      # with -c/-m the single positional argument is the revision
                      file_, rev = None, file_
                  elif rev is None:
                      raise error.CommandError('perfbdiff', 'invalid arguments')
                  if count is None:
                      # same default as the --count option for direct callers
                      count = 1
                  textpairs = []
                  r = cmdutil.openrevlog(repo, 'perfbdiff', file_, opts)
                  startrev = r.rev(r.lookup(rev))
                  # range() excludes its upper bound, so clamp to len(r); clamping to
                  # len(r) - 1 silently skipped the tip revision
                  for rev in range(startrev, min(startrev + count, len(r))):
                      if opts['alldata']:
                          # Load revisions associated with changeset.
                          ctx = repo[rev]
                          mtext = repo.manifest.revision(ctx.manifestnode())
                          for pctx in ctx.parents():
                              pman = repo.manifest.revision(pctx.manifestnode())
                              textpairs.append((pman, mtext))
                          # Load filelog revisions by iterating manifest delta.
                          man = ctx.manifest()
                          pman = ctx.p1().manifest()
                          for filename, change in pman.diff(man).items():
                              fctx = repo.file(filename)
                              f1 = fctx.revision(change[0][0] or -1)
                              f2 = fctx.revision(change[1][0] or -1)
                              textpairs.append((f1, f2))
                      else:
                          dp = r.deltaparent(rev)
                          textpairs.append((r.revision(dp), r.revision(rev)))
                  # all texts are collected above; only the bdiff calls are timed
                  def d():
                      for pair in textpairs:
                          bdiff.bdiff(*pair)
                  timer, fm = gettimer(ui, opts)
                  timer(d)
                  fm.end()
              @command('perfdiffwd', formatteropts)
              def perfdiffwd(ui, repo, **opts):
                  """Profile diff of working directory changes"""
                  timer, fm = gettimer(ui, opts)
                  # single-letter flag -> keyword argument handed to commands.diff
                  flagnames = {
                      'w': 'ignore_all_space',
                      'b': 'ignore_space_change',
                      'B': 'ignore_blank_lines',
                      }
                  for diffopt in ('', 'w', 'b', 'B', 'wB'):
                      diffargs = dict((flagnames[c], '1') for c in diffopt)
                      def rundiff():
                          ui.pushbuffer()
                          commands.diff(ui, repo, **diffargs)
                          ui.popbuffer()
                      if diffopt:
                          label = '-' + diffopt
                      else:
                          label = 'none'
                      timer(rundiff, 'diffopts: %s' % label)
                  fm.end()
              @command('perfrevlog', revlogopts + formatteropts +
                       [('d', 'dist', 100, 'distance between the revisions'),
                        ('s', 'startrev', 0, 'revision to start reading at'),
                        ('', 'reverse', False, 'read in reverse')],
                       '-c|-m|FILE')
              def perfrevlog(ui, repo, file_=None, startrev=0, reverse=False, **opts):
                  """Benchmark reading a series of revisions from a revlog.
                  By default, we read every ``-d/--dist`` revision from 0 to tip of
                  the specified revlog.
                  The start revision can be defined via ``-s/--startrev``.
                  """
                  timer, fm = gettimer(ui, opts)
                  _len = getlen(ui)
                  def d():
                      r = cmdutil.openrevlog(repo, 'perfrevlog', file_, opts)
                      # use a separate local: assigning to ``startrev`` here would
                      # shadow the argument and discard the -s/--startrev value
                      beginrev = startrev
                      endrev = _len(r)
                      dist = opts['dist']
                      if reverse:
                          # walk from the last revision down to ``startrev``
                          # inclusive (xrange excludes its stop value)
                          beginrev, endrev = endrev - 1, beginrev - 1
                          dist = -1 * dist
                      for x in xrange(beginrev, endrev, dist):
                          r.revision(r.node(x))
                  timer(d)
                  fm.end()
              @command('perfrevlogrevision', revlogopts + formatteropts +
                       [('', 'cache', False, 'use caches instead of clearing')],
                       '-c|-m|FILE REV')
              def perfrevlogrevision(ui, repo, file_, rev=None, cache=None, **opts):
                  """Benchmark obtaining a revlog revision.
                  Obtaining a revlog revision consists of roughly the following steps:
                  1. Compute the delta chain
                  2. Obtain the raw chunks for that delta chain
                  3. Decompress each raw chunk
                  4. Apply binary patches to obtain fulltext
                  5. Verify hash of fulltext
                  This command measures the time spent in each of these phases.
                  """
                  if opts.get('changelog') or opts.get('manifest'):
                      # with -c/-m the single positional argument is the revision
                      file_, rev = None, file_
                  elif rev is None:
                      raise error.CommandError('perfrevlogrevision', 'invalid arguments')
                  r = cmdutil.openrevlog(repo, 'perfrevlogrevision', file_, opts)
                  node = r.lookup(rev)
                  rev = r.rev(node)
                  # One helper per phase. Unless --cache was given, each helper first
                  # clears the revlog caches, so that call is part of the timed work.
                  def dodeltachain(rev):
                      if not cache:
                          r.clearcaches()
                      r._deltachain(rev)
                  def doread(chain):
                      if not cache:
                          r.clearcaches()
                      r._chunkraw(chain[0], chain[-1])
                  def dodecompress(data, chain):
                      if not cache:
                          r.clearcaches()
                      # bind lookups to locals before entering the loop
                      start = r.start
                      length = r.length
                      inline = r._inline
                      iosize = r._io.size
                      buffer = util.buffer
                      # ``data`` begins at the start of the first chunk of the chain
                      offset = start(chain[0])
                      for rev in chain:
                          chunkstart = start(rev)
                          if inline:
                              # NOTE(review): presumably skips the index entries that
                              # are interleaved with data in inline revlogs - confirm
                              chunkstart += (rev + 1) * iosize
                          chunklength = length(rev)
                          b = buffer(data, chunkstart - offset, chunklength)
                          revlog.decompress(b)
                  def dopatch(text, bins):
                      if not cache:
                          r.clearcaches()
                      mdiff.patches(text, bins)
                  def dohash(text):
                      if not cache:
                          r.clearcaches()
                      r._checkhash(text, node, rev)
                  def dorevision():
                      if not cache:
                          r.clearcaches()
                      r.revision(node)
                  # Compute the inputs of every phase once, outside of any timing.
                  chain = r._deltachain(rev)[0]
                  data = r._chunkraw(chain[0], chain[-1])[1]
                  bins = r._chunks(chain)
                  # first chunk is the base text, the remaining ones are patches
                  text = str(bins[0])
                  bins = bins[1:]
                  text = mdiff.patches(text, bins)
                  benches = [
                      (lambda: dorevision(), 'full'),
                      (lambda: dodeltachain(rev), 'deltachain'),
                      (lambda: doread(chain), 'read'),
                      (lambda: dodecompress(data, chain), 'decompress'),
                      (lambda: dopatch(text, bins), 'patch'),
                      (lambda: dohash(text), 'hash'),
                  ]
                  # a fresh timer/formatter pair is used for every phase
                  for fn, title in benches:
                      timer, fm = gettimer(ui, opts)
                      timer(fn, title=title)
                      fm.end()
              @command('perfrevset',
                       [('C', 'clear', False, 'clear volatile cache between each call.'),
                        ('', 'contexts', False, 'obtain changectx for each revision')]
                       + formatteropts, "REVSET")
              def perfrevset(ui, repo, expr, clear=False, contexts=False, **opts):
                  """benchmark the execution time of a revset
                  Use the --clear option to evaluate the impact of rebuilding the
                  volatile revision set caches on the revset execution. The volatile
                  caches hold the filtered and obsolescence related sets."""
                  timer, fm = gettimer(ui, opts)
                  def runrevset():
                      if clear:
                          repo.invalidatevolatilesets()
                      # --contexts iterates changectx objects, otherwise plain revs
                      if contexts:
                          results = repo.set(expr)
                      else:
                          results = repo.revs(expr)
                      # exhaust the result; the items themselves are not used
                      for unused in results:
                          pass
                  timer(runrevset)
                  fm.end()
              @command('perfvolatilesets', formatteropts)
              def perfvolatilesets(ui, repo, *names, **opts):
                  """benchmark the computation of various volatile set
                  Volatile set computes element related to filtering and obsolescence."""
                  timer, fm = gettimer(ui, opts)
                  repo = repo.unfiltered()
                  def wanted(table):
                      # sorted keys of ``table``, restricted to ``names`` when given
                      keys = sorted(table)
                      if names:
                          keys = [k for k in keys if k in names]
                      return keys
                  def obsbench(name):
                      def d():
                          repo.invalidatevolatilesets()
                          obsolete.getrevs(repo, name)
                      return d
                  def filterbench(name):
                      def d():
                          repo.invalidatevolatilesets()
                          repoview.filterrevs(repo, name)
                      return d
                  # obsolescence sets are timed first, then the repoview filters
                  for name in wanted(obsolete.cachefuncs):
                      timer(obsbench(name), title=name)
                  for name in wanted(repoview.filtertable):
                      timer(filterbench(name), title=name)
                  fm.end()
              @command('perfbranchmap',
                       [('f', 'full', False,
                         'Includes build time of subset'),
                       ] + formatteropts)
              def perfbranchmap(ui, repo, full=False, **opts):
                  """benchmark the update of a branchmap
                  This benchmarks the full repo.branchmap() call with read and write disabled
                  """
                  timer, fm = gettimer(ui, opts)
                  def getbranchmap(filtername):
                      """generate a benchmark function for the filtername"""
                      if filtername is None:
                          view = repo
                      else:
                          view = repo.filtered(filtername)
                      def d():
                          # with --full every cached branchmap is dropped, otherwise
                          # only the entry of the view being measured
                          if full:
                              view._branchcaches.clear()
                          else:
                              view._branchcaches.pop(filtername, None)
                          view.branchmap()
                      return d
                  # add filter in smaller subset to bigger subset
                  possiblefilters = set(repoview.filtertable)
                  subsettable = getbranchmapsubsettable()
                  allfilters = []
                  while possiblefilters:
                      # pick a filter whose subset (per subsettable) is not pending
                      # anymore; the loop's ``else`` only runs when none qualifies
                      for name in possiblefilters:
                          subset = subsettable.get(name)
                          if subset not in possiblefilters:
                              break
                      else:
                          assert False, 'subset cycle %s!' % possiblefilters
                      allfilters.append(name)
                      possiblefilters.remove(name)
                  # warm the cache
                  if not full:
                      for name in allfilters:
                          repo.filtered(name).branchmap()
                  # add unfiltered
                  allfilters.append(None)
                  # replace branchmap.read and branchcache.write with functions that
                  # do nothing while timing; both are restored in the finally block
                  branchcacheread = safeattrsetter(branchmap, 'read')
                  branchcachewrite = safeattrsetter(branchmap.branchcache, 'write')
                  branchcacheread.set(lambda repo: None)
                  branchcachewrite.set(lambda bc, repo: None)
                  try:
                      for name in allfilters:
                          timer(getbranchmap(name), title=str(name))
                  finally:
                      branchcacheread.restore()
                      branchcachewrite.restore()
                  fm.end()
              @command('perfloadmarkers')
              def perfloadmarkers(ui, repo):
                  """benchmark the time to parse the on-disk markers for a repo
                  Result is the number of markers in the repo."""
                  timer, fm = gettimer(ui)
                  svfs = getsvfs(repo)
                  def countmarkers():
                      # a new obsstore is built on every timed call
                      return len(obsolete.obsstore(svfs))
                  timer(countmarkers)
                  fm.end()
              @command('perflrucachedict', formatteropts +
                  [('', 'size', 4, 'size of cache'),
                   ('', 'gets', 10000, 'number of key lookups'),
                   ('', 'sets', 10000, 'number of key sets'),
                   ('', 'mixed', 10000, 'number of mixed mode operations'),
                   ('', 'mixedgetfreq', 50, 'frequency of get vs set ops in mixed mode')],
                  norepo=True)
              def perflrucache(ui, size=4, gets=10000, sets=10000, mixed=10000,
                               mixedgetfreq=50, **opts):
                  # Benchmarks util.lrucachedict in four modes: construction, lookups,
                  # insertions and a mix of both. The random inputs are generated up
                  # front, in the order values, gets, sets, mixed.
                  def doinit():
                      for i in xrange(10000):
                          util.lrucachedict(size)
                  values = [random.randint(0, sys.maxint) for i in xrange(size)]
                  # Get mode fills the cache and tests raw lookup performance with no
                  # eviction.
                  getseq = [random.choice(values) for i in xrange(gets)]
                  def dogets():
                      cache = util.lrucachedict(size)
                      for v in values:
                          cache[v] = v
                      for key in getseq:
                          value = cache[key]
                          value # silence pyflakes warning
                  # Set mode tests insertion speed with cache eviction.
                  setseq = [random.randint(0, sys.maxint) for i in xrange(sets)]
                  def dosets():
                      cache = util.lrucachedict(size)
                      for v in setseq:
                          cache[v] = v
                  # Mixed mode randomly performs gets and sets with eviction.
                  # op 0 is a get, op 1 is a set.
                  mixedops = []
                  for i in xrange(mixed):
                      if random.randint(0, 100) < mixedgetfreq:
                          op = 0
                      else:
                          op = 1
                      mixedops.append((op, random.randint(0, size * 2)))
                  def domixed():
                      cache = util.lrucachedict(size)
                      for op, v in mixedops:
                          if op != 0:
                              cache[v] = v
                              continue
                          try:
                              cache[v]
                          except KeyError:
                              pass
                  benches = [
                      (doinit, 'init'),
                      (dogets, 'gets'),
                      (dosets, 'sets'),
                      (domixed, 'mixed')
                  ]
                  # a fresh timer/formatter pair is used for every mode
                  for fn, title in benches:
                      timer, fm = gettimer(ui, opts)
                      timer(fn, title=title)
                      fm.end()
              def uisetup(ui):
                  # Wrap cmdutil.openrevlog only when it exists while
                  # commands.debugrevlogopts does not.
                  if not util.safehasattr(cmdutil, 'openrevlog'):
                      return
                  if util.safehasattr(commands, 'debugrevlogopts'):
                      return
                  # for "historical portability":
                  # In this case, Mercurial should be 1.9 (or a79fea6b3e77) -
                  # 3.7 (or 5606f7d0d063). Therefore, '--dir' option for
                  # openrevlog() should cause failure, because it has been
                  # available since 3.5 (or 49c583ca48c4).
                  def openrevlog(orig, repo, cmd, file_, opts):
                      wantsdir = opts.get('dir')
                      if wantsdir and not util.safehasattr(repo, 'dirlog'):
                          raise error.Abort("This version doesn't support --dir option",
                                            hint="use 3.5 or later")
                      return orig(repo, cmd, file_, opts)
                  extensions.wrapfunction(cmdutil, 'openrevlog', openrevlog)

mercurial/manifest.py

0 +4 -4

              # manifest.py - manifest revision class for mercurial
              #
              # Copyright 2005-2007 Matt Mackall <mpm@selenic.com>
              #
              # This software may be used and distributed according to the terms of the
              # GNU General Public License version 2 or any later version.
              from __future__ import absolute_import
              import array
              import heapq
              import os
              import struct
              from .i18n import _
              from . import (
                  error,
                  mdiff,
                  parsers,
                  revlog,
                  util,
              )
              # module-level alias for util.propertycache
              propertycache = util.propertycache
              def _parsev1(data):
                  # This method does a little bit of excessive-looking
                  # precondition checking. This is so that the behavior of this
                  # class exactly matches its C counterpart to try and help
                  # prevent surprise breakage for anyone that develops against
                  # the pure version.
                  if data and data[-1] != '\n':
                      raise ValueError('Manifest did not end in a newline.')
                  prev = None
                  for l in data.splitlines():
                      if prev is not None and prev > l:
                          raise ValueError('Manifest lines not in sorted order.')
                      prev = l
                      f, n = l.split('\0')
                      if len(n) > 40:
                          yield f, revlog.bin(n[:40]), n[40:]
                      else:
                          yield f, revlog.bin(n), ''
              def _parsev2(data):
                  metadataend = data.find('\n')
                  # Just ignore metadata for now
                  pos = metadataend + 1
                  prevf = ''
                  while pos < len(data):
                      end = data.find('\n', pos + 1) # +1 to skip stem length byte
                      if end == -1:
                          raise ValueError('Manifest ended with incomplete file entry.')
                      stemlen = ord(data[pos])
                      items = data[pos + 1:end].split('\0')
                      f = prevf[:stemlen] + items[0]
                      if prevf > f:
                          raise ValueError('Manifest entries not in sorted order.')
                      fl = items[1]
                      # Just ignore metadata (items[2:] for now)
                      n = data[end + 1:end + 21]
                      yield f, n, fl
                      pos = end + 22
                      prevf = f
              def _parse(data):
                  """Generates (path, node, flags) tuples from a manifest text"""
                  # a leading NUL byte selects the v2 parser
                  parser = _parsev1
                  if data.startswith('\0'):
                      parser = _parsev2
                  return iter(parser(data))
              def _text(it, usemanifestv2):
                  """Given an iterator over (path, node, flags) tuples, returns a manifest
                  text"""
                  serialize = _textv1
                  if usemanifestv2:
                      serialize = _textv2
                  return serialize(it)
              def _textv1(it):
                  """Serialize (path, node, flags) tuples into a v1 manifest text."""
                  tohex = revlog.hex
                  paths = []
                  chunks = []
                  for path, node, flags in it:
                      paths.append(path)
                      # if this is changed to support newlines in filenames,
                      # be sure to check the templates/ dir again (especially *-raw.tmpl)
                      chunks.append("%s\0%s%s\n" % (path, tohex(node), flags))
                  # the paths are validated only after all entries were formatted
                  _checkforbidden(paths)
                  return ''.join(chunks)
              def _textv2(it):
                  """Serialize (path, node, flags) tuples into a v2 manifest text."""
                  paths = []
                  # the text opens with a NUL byte followed by a newline
                  chunks = ['\0\n']
                  previous = ''
                  for path, node, flags in it:
                      paths.append(path)
                      shared = os.path.commonprefix([previous, path])
                      # the stem length is written with %c, hence capped at 255
                      stemlen = min(len(shared), 255)
                      chunks.append("%c%s\0%s\n%s\n" % (stemlen, path[stemlen:], flags,
                                                        node))
                      previous = path
                  _checkforbidden(paths)
                  return ''.join(chunks)
              class lazymanifestiter(object):
                  def __init__(self, lm):
                      self.pos = 0
                      self.lm = lm
                  def __iter__(self):
                      return self
                  def next(self):
                      try:
                          data, pos = self.lm._get(self.pos)
                      except IndexError:
                          raise StopIteration
                      if pos == -1:
                          self.pos += 1
                          return data[0]
                      self.pos += 1
                      zeropos = data.find('\x00', pos)
                      return data[pos:zeropos]
              class lazymanifestiterentries(object):
                  def __init__(self, lm):
                      self.lm = lm
                      self.pos = 0
                  def __iter__(self):
                      return self
                  def next(self):
                      try:
                          data, pos = self.lm._get(self.pos)
                      except IndexError:
                          raise StopIteration
                      if pos == -1:
                          self.pos += 1
                          return data
                      zeropos = data.find('\x00', pos)
                      hashval = unhexlify(data, self.lm.extrainfo[self.pos],
                                          zeropos + 1, 40)
                      flags = self.lm._getflags(data, self.pos, zeropos)
                      self.pos += 1
                      return (data[pos:zeropos], hashval, flags)
              def unhexlify(data, extra, pos, length):
                  """Decode ``length`` hex characters of ``data`` starting at ``pos``.

                  When ``extra`` is non-zero, the character for its low 8 bits is
                  appended to the decoded string.
                  """
                  s = data[pos:pos + length].decode('hex')
                  if extra:
                      s += chr(extra & 0xff)
                  return s
              def _cmp(a, b):
                  return (a > b) - (a < b)
              class _lazymanifest(object):
                  def __init__(self, data, positions=None, extrainfo=None, extradata=None):
                      if positions is None:
                          self.positions = self.findlines(data)
                          self.extrainfo = [0] * len(self.positions)
                          self.data = data
                          self.extradata = []
                      else:
                          self.positions = positions[:]
                          self.extrainfo = extrainfo[:]
                          self.extradata = extradata[:]
                          self.data = data
                  def findlines(self, data):
                      if not data:
                          return []
                      pos = data.find("\n")
                      if pos == -1 or data[-1] != '\n':
                          raise ValueError("Manifest did not end in a newline.")
                      positions = [0]
                      prev = data[:data.find('\x00')]
                      while pos < len(data) - 1 and pos != -1:
                          positions.append(pos + 1)
                          nexts = data[pos + 1:data.find('\x00', pos + 1)]
                          if nexts < prev:
                              raise ValueError("Manifest lines not in sorted order.")
                          prev = nexts
                          pos = data.find("\n", pos + 1)
                      return positions
                  def _get(self, index):
                      # get the position encoded in pos:
                      #   positive number is an index in 'data'
                      #   negative number is in extrapieces
                      pos = self.positions[index]
                      if pos >= 0:
                          return self.data, pos
                      return self.extradata[-pos - 1], -1
                  def _getkey(self, pos):
                      if pos >= 0:
                          return self.data[pos:self.data.find('\x00', pos + 1)]
                      return self.extradata[-pos - 1][0]
                  def bsearch(self, key):
                      first = 0
                      last = len(self.positions) - 1
                      while first <= last:
                          midpoint = (first + last)//2
                          nextpos = self.positions[midpoint]
                          candidate = self._getkey(nextpos)
                          r = _cmp(key, candidate)
                          if r == 0:
                              return midpoint
                          else:
                              if r < 0:
                                  last = midpoint - 1
                              else:
                                  first = midpoint + 1
                      return -1
                  def bsearch2(self, key):
                      # same as the above, but will always return the position
                      # done for performance reasons
                      first = 0
                      last = len(self.positions) - 1
                      while first <= last:
                          midpoint = (first + last)//2
                          nextpos = self.positions[midpoint]
                          candidate = self._getkey(nextpos)
                          r = _cmp(key, candidate)
                          if r == 0:
                              return (midpoint, True)
                          else:
                              if r < 0:
                                  last = midpoint - 1
                              else:
                                  first = midpoint + 1
                      return (first, False)
                  def __contains__(self, key):
                      return self.bsearch(key) != -1
                  def _getflags(self, data, needle, pos):
                      start = pos + 41
                      end = data.find("\n", start)
                      if end == -1:
                          end = len(data) - 1
                      if start == end:
                          return ''
                      return self.data[start:end]
                  def __getitem__(self, key):
                      if not isinstance(key, str):
                          raise TypeError("getitem: manifest keys must be a string.")
                      needle = self.bsearch(key)
                      if needle == -1:
                          raise KeyError
                      data, pos = self._get(needle)
                      if pos == -1:
                          return (data[1], data[2])
                      zeropos = data.find('\x00', pos)
                      assert 0 <= needle <= len(self.positions)
                      assert len(self.extrainfo) == len(self.positions)
                      hashval = unhexlify(data, self.extrainfo[needle], zeropos + 1, 40)
                      flags = self._getflags(data, needle, zeropos)
                      return (hashval, flags)
                  def __delitem__(self, key):
                      needle, found = self.bsearch2(key)
                      if not found:
                          raise KeyError
                      cur = self.positions[needle]
                      self.positions = self.positions[:needle] + self.positions[needle + 1:]
                      self.extrainfo = self.extrainfo[:needle] + self.extrainfo[needle + 1:]
                      if cur >= 0:
                          self.data = self.data[:cur] + '\x00' + self.data[cur + 1:]
                  def __setitem__(self, key, value):
                      if not isinstance(key, str):
                          raise TypeError("setitem: manifest keys must be a string.")
                      if not isinstance(value, tuple) or len(value) != 2:
                          raise TypeError("Manifest values must be a tuple of (node, flags).")
                      hashval = value[0]
                      if not isinstance(hashval, str) or not 20 <= len(hashval) <= 22:
                          raise TypeError("node must be a 20-byte string")
                      flags = value[1]
                      if len(hashval) == 22:
                          hashval = hashval[:-1]
                      if not isinstance(flags, str) or len(flags) > 1:
                          raise TypeError("flags must a 0 or 1 byte string, got %r", flags)
                      needle, found = self.bsearch2(key)
                      if found:
                          # put the item
                          pos = self.positions[needle]
                          if pos < 0:
                              self.extradata[-pos - 1] = (key, hashval, value[1])
                          else:
                              # just don't bother
                              self.extradata.append((key, hashval, value[1]))
                              self.positions[needle] = -len(self.extradata)
                      else:
                          # not found, put it in with extra positions
                          self.extradata.append((key, hashval, value[1]))
                          self.positions = (self.positions[:needle] + [-len(self.extradata)]
                                            + self.positions[needle:])
                          self.extrainfo = (self.extrainfo[:needle] + [0] +
                                            self.extrainfo[needle:])
                  def copy(self):
                      """Return a new _lazymanifest built from this instance's state.

                      The data, positions, extrainfo and extradata attributes are passed
                      to the constructor as they are; no compaction is done first.
                      """
                      # XXX call _compact like in C?
                      return _lazymanifest(self.data, self.positions, self.extrainfo,
                          self.extradata)
                  def _compact(self):
                      """Fold all pending extradata entries back into ``self.data``.

                      Rebuilds ``self.data`` from the runs of entries that still live in
                      the old text and from the packed form of the extradata entries,
                      rewrites ``self.positions`` as offsets into the new text, resets
                      ``self.extrainfo`` and empties ``self.extradata``.  Does nothing
                      when there is no extradata.
                      """
                      # hopefully not called TOO often
                      if len(self.extradata) == 0:
                          return
                      # pieces of the new text, joined at the end
                      l = []
                      last_cut = 0
                      i = 0
                      # offset of the current entry inside the new text
                      offset = 0
                      self.extrainfo = [0] * len(self.positions)
                      while i < len(self.positions):
                          if self.positions[i] >= 0:
                              # run of consecutive entries backed by the old text
                              cur = self.positions[i]
                              last_cut = cur
                              while True:
                                  self.positions[i] = offset
                                  i += 1
                                  if i == len(self.positions) or self.positions[i] < 0:
                                      break
                                  # advance by the distance between old positions
                                  offset += self.positions[i] - cur
                                  cur = self.positions[i]
                              # the run ends after the newline of its last entry
                              end_cut = self.data.find('\n', cur)
                              if end_cut != -1:
                                  end_cut += 1
                              offset += end_cut - cur
                              l.append(self.data[last_cut:end_cut])
                          else:
                              # run of consecutive entries backed by extradata
                              while i < len(self.positions) and self.positions[i] < 0:
                                  cur = self.positions[i]
                                  t = self.extradata[-cur - 1]
                                  l.append(self._pack(t))
                                  self.positions[i] = offset
                                  if len(t[1]) > 20:
                                      # NOTE(review): __setitem__ stores nodes of at most
                                      # 21 bytes, so index 21 looks out of range for a
                                      # 21-byte node -- confirm whether 20 was intended
                                      self.extrainfo[i] = ord(t[1][21])
                                  offset += len(l[-1])
                                  i += 1
                      self.data = ''.join(l)
                      self.extradata = []
                  def _pack(self, d):
                      """Serialize the extradata tuple ``d`` into one manifest line.

                      The line is d[0], a NUL byte, the hex encoding of the first 20
                      bytes of d[1], then d[2] and a newline.
                      """
                      return d[0] + '\x00' + d[1][:20].encode('hex') + d[2] + '\n'
                  def text(self):
                      """Return the manifest text after compacting pending changes."""
                      # _compact() merges extradata into self.data before it is returned
                      self._compact()
                      return self.data
                  def diff(self, m2, clean=False):
                      '''Compare this manifest with m2 and return the differences.

                      The result maps each differing file name to a pair
                      ((node1, flags1), (node2, flags2)); the side on which the file is
                      missing is (None, '').  When clean is true, files that are equal on
                      both sides are included with a None value.
                      '''
                      # XXX think whether efficiency matters here
                      changes = {}
                      for path, node, fl in self.iterentries():
                          mine = (node, fl)
                          if path not in m2:
                              changes[path] = mine, (None, '')
                              continue
                          theirs = m2[path]
                          if mine != theirs:
                              changes[path] = mine, theirs
                          elif clean:
                              changes[path] = None
                      # second pass: files that exist only in m2
                      for path, node, fl in m2.iterentries():
                          if path not in self:
                              changes[path] = (None, ''), (node, fl)
                      return changes
                  def iterentries(self):
                      """Return a lazymanifestiterentries iterator over this manifest."""
                      return lazymanifestiterentries(self)
                  def iterkeys(self):
                      """Return a lazymanifestiter iterator over this manifest."""
                      return lazymanifestiter(self)
                  def __iter__(self):
                      """Return a lazymanifestiter iterator, exactly like iterkeys()."""
                      return lazymanifestiter(self)
                  def __len__(self):
                      """Return the number of entries, i.e. the length of positions."""
                      return len(self.positions)
                  def filtercopy(self, filterfn):
                      """Return a new _lazymanifest holding the entries accepted by filterfn.

                      filterfn is called with each file name; entries for which it returns
                      a false value are left out of the copy.
                      """
                      # XXX should be optimized
                      filtered = _lazymanifest('')
                      for path, node, fl in self.iterentries():
                          if not filterfn(path):
                              continue
                          filtered[path] = node, fl
                      return filtered
              # Prefer parsers.lazymanifest when the parsers module provides it;
              # otherwise keep the _lazymanifest class defined above.
              _lazymanifest = getattr(parsers, 'lazymanifest', _lazymanifest)
              class manifestdict(object):
                  '''Flat manifest mapping file names to nodes and flags.

                  All storage is delegated to a _lazymanifest instance kept in
                  self._lm; the methods here adapt it to a dict-like interface.
                  '''
                  def __init__(self, data=''):
                      '''Build the manifest from the manifest text data.'''
                      if data.startswith('\0'):
                          #_lazymanifest can not parse v2
                          # so parse the text here and insert the entries one by one
                          self._lm = _lazymanifest('')
                          for f, n, fl in _parsev2(data):
                              self._lm[f] = n, fl
                      else:
                          self._lm = _lazymanifest(data)
                  def __getitem__(self, key):
                      '''Return the node stored for key (first item of the entry).'''
                      return self._lm[key][0]
                  def find(self, key):
                      '''Return the whole entry stored for key in the lazy manifest.'''
                      return self._lm[key]
                  def __len__(self):
                      '''Return the number of entries in the manifest.'''
                      return len(self._lm)
                  def __nonzero__(self):
                      # nonzero is covered by the __len__ function, but implementing it here
                      # makes it easier for extensions to override.
                      return len(self._lm) != 0
                  def __setitem__(self, key, node):
                      '''Set the node for key, keeping the flags key already has.'''
                      # flags() returns '' when the key is not present yet
                      self._lm[key] = node, self.flags(key, '')
                  def __contains__(self, key):
                      '''Return whether key is present in the manifest.'''
                      return key in self._lm
                  def __delitem__(self, key):
                      '''Delete the entry stored for key.'''
                      del self._lm[key]
                  def __iter__(self):
                      '''Iterate using the lazy manifest's own __iter__.'''
                      return self._lm.__iter__()
                  def iterkeys(self):
                      '''Return the lazy manifest's iterkeys() iterator.'''
                      return self._lm.iterkeys()
                  def keys(self):
                      '''Return the result of iterkeys() as a list.'''
                      return list(self.iterkeys())
                  def filesnotin(self, m2):
                      '''Set of files in this manifest that are not in the other'''
                      diff = self.diff(m2)
                      # keep the entries whose m2 side has no node (None)
                      files = set(filepath
                                  for filepath, hashflags in diff.iteritems()
                                  if hashflags[1][0] is None)
                      return files
                  @propertycache
                  def _dirs(self):
                      # util.dirs object built from this manifest
                      return util.dirs(self)
                  def dirs(self):
                      '''Return the util.dirs object for this manifest.'''
                      return self._dirs
                  def hasdir(self, dir):
                      '''Return whether dir is contained in the util.dirs object.'''
                      return dir in self._dirs
                  def _filesfastpath(self, match):
                      '''Checks whether we can correctly and quickly iterate over matcher
                      files instead of over manifest files.'''
                      files = match.files()
                      # fewer than 100 files and either an exact matcher, or a prefix
                      # matcher whose files are all present in this manifest
                      return (len(files) < 100 and (match.isexact() or
                          (match.prefix() and all(fn in self for fn in files))))
                  def walk(self, match):
                      '''Generates matching file names.
                      Equivalent to manifest.matches(match).iterkeys(), but without creating
                      an entirely new manifest.
                      It also reports nonexistent files by marking them bad with match.bad().
                      '''
                      if match.always():
                          for f in iter(self):
                              yield f
                          return
                      fset = set(match.files())
                      # avoid the entire walk if we're only looking for specific files
                      # NOTE(review): this fast path yields every requested file without
                      # checking that it is in the manifest and never calls match.bad(),
                      # while the fast path in matches() filters with "fn in lm" --
                      # confirm that the difference is intended
                      if self._filesfastpath(match):
                          for fn in sorted(fset):
                              yield fn
                          return
                      for fn in self:
                          if fn in fset:
                              # specified pattern is the exact name
                              fset.remove(fn)
                          if match(fn):
                              yield fn
                      # for dirstate.walk, files=['.'] means "walk the whole tree".
                      # follow that here, too
                      fset.discard('.')
                      # whatever is left in fset was never seen as a file name
                      for fn in sorted(fset):
                          if not self.hasdir(fn):
                              match.bad(fn, None)
                  def matches(self, match):
                      '''generate a new manifest filtered by the match argument'''
                      if match.always():
                          return self.copy()
                      if self._filesfastpath(match):
                          # copy only the requested files that exist in this manifest
                          m = manifestdict()
                          lm = self._lm
                          for fn in match.files():
                              if fn in lm:
                                  m._lm[fn] = lm[fn]
                          return m
                      # general case: let the lazy manifest filter every entry
                      m = manifestdict()
                      m._lm = self._lm.filtercopy(match)
                      return m
                  def diff(self, m2, clean=False):
                      '''Finds changes between the current manifest and m2.
                      Args:
                        m2: the manifest to which this manifest should be compared.
                        clean: if true, include files unchanged between these manifests
                               with a None value in the returned dictionary.
                      The result is returned as a dict with filename as key and
                      values of the form ((n1,fl1),(n2,fl2)), where n1/n2 is the
                      nodeid in the current/other manifest and fl1/fl2 is the flag
                      in the current/other manifest. Where the file does not exist,
                      the nodeid will be None and the flags will be the empty
                      string.
                      '''
                      return self._lm.diff(m2._lm, clean)
                  def setflag(self, key, flag):
                      '''Set the flag for key while keeping its current node.'''
                      # self[key] raises through to the caller if key is missing
                      self._lm[key] = self[key], flag
                  def get(self, key, default=None):
                      '''Return the node for key, or default when key is missing.'''
                      try:
                          return self._lm[key][0]
                      except KeyError:
                          return default
                  def flags(self, key, default=''):
                      '''Return the flags for key, or default when key is missing.'''
                      try:
                          return self._lm[key][1]
                      except KeyError:
                          return default
                  def copy(self):
                      '''Return a new manifestdict wrapping a copy of the lazy manifest.'''
                      c = manifestdict()
                      c._lm = self._lm.copy()
                      return c
                  def iteritems(self):
                      '''Iterate over the first two fields of each lazy manifest entry.'''
                      return (x[:2] for x in self._lm.iterentries())
                  def iterentries(self):
                      '''Return the lazy manifest's iterentries() iterator.'''
                      return self._lm.iterentries()
                  def text(self, usemanifestv2=False):
                      '''Return the manifest text, in v2 form when usemanifestv2 is set.'''
                      if usemanifestv2:
                          return _textv2(self._lm.iterentries())
                      else:
                          # use (probably) native version for v1
                          return self._lm.text()
                  def fastdelta(self, base, changes):
                      """Given a base manifest text as an array.array and a list of changes
                      relative to that text, compute a delta that can be used by revlog.

                      changes is an iterable of (filename, todelete) pairs.  Returns the
                      tuple (arraytext, deltatext).
                      """
                      delta = []
                      # dstart/dend: range of base covered by the pending delta chunk
                      # dline: replacement lines collected for that chunk
                      dstart = None
                      dend = None
                      dline = [""]
                      start = 0
                      # zero copy representation of base as a buffer
                      addbuf = util.buffer(base)
                      changes = list(changes)
                      if len(changes) < 1000:
                          # start with a readonly loop that finds the offset of
                          # each line and creates the deltas
                          for f, todelete in changes:
                              # bs will either be the index of the item or the insert point
                              # the previous start is passed on as the search lower bound
                              start, end = _msearch(addbuf, f, start)
                              if not todelete:
                                  h, fl = self._lm[f]
                                  l = "%s\0%s%s\n" % (f, revlog.hex(h), fl)
                              else:
                                  if start == end:
                                      # item we want to delete was not found, error out
                                      raise AssertionError(
                                              _("failed to remove %s from manifest") % f)
                                  l = ""
                              if dstart is not None and dstart <= start and dend >= start:
                                  # this change begins inside or right at the end of the
                                  # pending chunk: extend the chunk instead of starting one
                                  if dend < end:
                                      dend = end
                                  if l:
                                      dline.append(l)
                              else:
                                  # flush the pending chunk, if any, and start a new one
                                  if dstart is not None:
                                      delta.append([dstart, dend, "".join(dline)])
                                  dstart = start
                                  dend = end
                                  dline = [l]
                          # flush the last pending chunk
                          if dstart is not None:
                              delta.append([dstart, dend, "".join(dline)])
                          # apply the delta to the base, and get a delta for addrevision
                          deltatext, arraytext = _addlistdelta(base, delta)
                      else:
                          # For large changes, it's much cheaper to just build the text and
                          # diff it.
                          arraytext = array.array('c', self.text())
                          deltatext = mdiff.textdiff(base, arraytext)
                      return arraytext, deltatext
              def _msearch(m, s, lo=0, hi=None):
                  '''return a tuple (start, end) that says where to find s within m.
                  If the string is found m[start:end] are the line containing
                  that string.  If start == end the string was not found and
                  they indicate the proper sorted insertion point.
                  m should be a buffer or a string
                  s is a string'''
                  def advance(i, c):
                      while i < lenm and m[i] != c:
                          i += 1
                      return i
                  if not s:
                      return (lo, lo)
                  lenm = len(m)
                  if not hi:
                      hi = lenm
                  while lo < hi:
                      mid = (lo + hi) // 2
                      start = mid
                      while start > 0 and m[start - 1] != '\n':
                          start -= 1
                      end = advance(start, '\0')
                      if m[start:end] < s:
                          # we know that after the null there are 40 bytes of sha1
                          # this translates to the bisect lo = mid + 1
                          lo = advance(end + 40, '\n') + 1
                      else:
                          # this translates to the bisect hi = mid
                          hi = start
                  end = advance(lo, '\0')
                  found = m[lo:end]
                  if s == found:
                      # we know that after the null there are 40 bytes of sha1
                      end = advance(end + 40, '\n')
                      return (lo, end + 1)
                  else:
                      return (lo, lo)
              def _checkforbidden(l):
                  """Check filenames for illegal characters."""
                  for f in l:
                      if '\n' in f or '\r' in f:
                          raise error.RevlogError(
                              _("'\\n' and '\\r' disallowed in filenames: %r") % f)
              # apply the changes collected during the bisect loop to our addlist
              # return a delta suitable for addrevision
              def _addlistdelta(addlist, x):
                  """Apply the delta chunks in x to addlist.

                  x is a sequence of (start, end, content) chunks.  Returns the tuple
                  (deltatext, newaddlist): the chunks encoded as a binary delta and a
                  new array holding addlist with the chunks applied.
                  """
                  # for large addlist arrays, building a new array is cheaper
                  # than repeatedly modifying the existing one
                  rebuilt = array.array('c')
                  consumed = 0
                  for start, end, content in x:
                      # keep the untouched bytes in front of this chunk
                      rebuilt += addlist[consumed:start]
                      if content:
                          rebuilt += array.array('c', content)
                      consumed = end
                  rebuilt += addlist[consumed:]
                  # each chunk becomes a ">lll" header followed by its content
                  encoded = [struct.pack(">lll", start, end, len(content)) + content
                             for start, end, content in x]
                  return "".join(encoded), rebuilt
              def _splittopdir(f):
                  if '/' in f:
                      dir, subpath = f.split('/', 1)
                      return dir + '/', subpath
                  else:
                      return '', f
              _noop = lambda s: None
              class treemanifest(object):
                  def __init__(self, dir='', text=''):
                      """Create a tree manifest for the directory ``dir``.

                      When ``text`` is non-empty it is parsed as a flat manifest and the
                      instance is marked dirty afterwards.
                      """
                      self._dir = dir
                      self._node = revlog.nullid
                      self._dirty = False
                      # no deferred load or copy is pending on a fresh instance
                      self._loadfunc = self._copyfunc = _noop
                      # Using _lazymanifest here is a little slower than plain old dicts
                      self._dirs, self._files, self._flags = {}, {}, {}
                      if not text:
                          return
                      def _nosubtrees(subdir, subm):
                          raise AssertionError('treemanifest constructor only accepts '
                                               'flat manifests')
                      self.parse(text, _nosubtrees)
                      # Mark flat manifest dirty after parsing
                      self._dirty = True
                  def _subpath(self, path):
                      """Return path prefixed with this manifest's directory."""
                      return self._dir + path
                  def __len__(self):
                      """Return the number of files in this tree, subtrees included."""
                      self._load()
                      nested = sum(sub.__len__() for sub in self._dirs.values())
                      return len(self._files) + nested
                  def _isempty(self):
                      """Return True when neither this tree nor any subtree has files."""
                      self._load() # for consistency; already loaded by all callers
                      if self._files:
                          return False
                      for sub in self._dirs.values():
                          if not sub._isempty():
                              return False
                      return True
                  def __repr__(self):
                      """Return a debugging description of this tree manifest."""
                      fmt = '<treemanifest dir=%s, node=%s, loaded=%s, dirty=%s at 0x%x>'
                      # "loaded" means that no deferred load function is pending
                      loaded = bool(self._loadfunc is _noop)
                      fields = (self._dir, revlog.hex(self._node), loaded,
                                self._dirty, id(self))
                      return fmt % fields
                  def dir(self):
                      '''The directory that this tree manifest represents, including a
                      trailing '/'. Empty string for the repo root directory.

                      Returns the value of self._dir unchanged.'''
                      return self._dir
                  def node(self):
                      '''The node of this instance. nullid for unsaved instances. Should
                      be updated when the instance is read or written from a revlog.

                      Asserts that the instance is not dirty before returning the node.
                      '''
                      assert not self._dirty
                      return self._node
                  def setnode(self, node):
                      """Record node as this instance's node and clear the dirty flag."""
                      self._node = node
                      self._dirty = False
                  def iterentries(self):
                      """Yield (path, node, flags) for every file, subtrees included.

                      Entries of this directory are visited in sorted name order; a
                      subdirectory contributes the entries of its own iterentries().
                      """
                      self._load()
                      entries = self._dirs.items() + self._files.items()
                      entries.sort()
                      for name, value in entries:
                          if name not in self._files:
                              # value is a subtree: delegate to it
                              for entry in value.iterentries():
                                  yield entry
                              continue
                          yield self._subpath(name), value, self._flags.get(name, '')
                  def iteritems(self):
                      """Yield (path, node) for every file, subtrees included.

                      Entries of this directory are visited in sorted name order; a
                      subdirectory contributes the pairs of its own iteritems().
                      """
                      self._load()
                      entries = self._dirs.items() + self._files.items()
                      entries.sort()
                      for name, value in entries:
                          if name not in self._files:
                              # value is a subtree: delegate to it
                              for path, node in value.iteritems():
                                  yield path, node
                              continue
                          yield self._subpath(name), value
                  def iterkeys(self):
                      """Yield the full path of every file, subtrees included.

                      Names of this directory are visited in sorted order; a
                      subdirectory contributes the paths of its own iterkeys().
                      """
                      self._load()
                      names = self._dirs.keys() + self._files.keys()
                      names.sort()
                      for name in names:
                          if name not in self._files:
                              for path in self._dirs[name].iterkeys():
                                  yield path
                              continue
                          yield self._subpath(name)
                  def keys(self):
                      """Return the paths produced by iterkeys() as a list."""
                      return list(self.iterkeys())
                  def __iter__(self):
                      """Iterate over the same paths as iterkeys()."""
                      return self.iterkeys()
                  def __contains__(self, f):
                      """Return whether the file f is present in this tree.

                      None is never contained.
                      """
                      if f is None:
                          return False
                      self._load()
                      topdir, rest = _splittopdir(f)
                      if not topdir:
                          # no directory component: look among this tree's own files
                          return f in self._files
                      if topdir not in self._dirs:
                          return False
                      return self._dirs[topdir].__contains__(rest)
                  def get(self, f, default=None):
                      """Return the node stored for f, or default when f is missing."""
                      self._load()
                      topdir, rest = _splittopdir(f)
                      if not topdir:
                          return self._files.get(f, default)
                      if topdir in self._dirs:
                          return self._dirs[topdir].get(rest, default)
                      return default
                  def __getitem__(self, f):
                      """Return the node stored for f; a missing entry raises KeyError."""
                      self._load()
                      topdir, rest = _splittopdir(f)
                      if not topdir:
                          return self._files[f]
                      return self._dirs[topdir].__getitem__(rest)
                  def flags(self, f):
                      """Return the flags of f, or '' when f is unknown or names a dir."""
                      self._load()
                      topdir, rest = _splittopdir(f)
                      if topdir:
                          if topdir in self._dirs:
                              return self._dirs[topdir].flags(rest)
                          return ''
                      if f in self._dirs:
                          return ''
                      return self._flags.get(f, '')
                  def find(self, f):
                      """Return (node, flags) for f; a missing entry raises KeyError."""
                      self._load()
                      topdir, rest = _splittopdir(f)
                      if not topdir:
                          return self._files[f], self._flags.get(f, '')
                      return self._dirs[topdir].find(rest)
                  def __delitem__(self, f):
                      """Delete the file f and mark this tree dirty.

                      A subtree that becomes empty through the deletion is dropped.
                      """
                      self._load()
                      topdir, rest = _splittopdir(f)
                      if not topdir:
                          del self._files[f]
                          # the flags entry is optional
                          self._flags.pop(f, None)
                      else:
                          subtree = self._dirs[topdir]
                          subtree.__delitem__(rest)
                          # If the directory is now empty, remove it
                          if subtree._isempty():
                              del self._dirs[topdir]
                      self._dirty = True
                  def __setitem__(self, f, n):
                      """Store the node n for the file f and mark this tree dirty.

                      Subtrees missing along the path are created on the way.
                      """
                      assert n is not None
                      self._load()
                      topdir, rest = _splittopdir(f)
                      if not topdir:
                          self._files[f] = n[:21] # to match manifestdict's behavior
                      else:
                          try:
                              subtree = self._dirs[topdir]
                          except KeyError:
                              subtree = treemanifest(self._subpath(topdir))
                              self._dirs[topdir] = subtree
                          subtree.__setitem__(rest, n)
                      self._dirty = True
                  def _load(self):
                      """Run the pending load function, or else the pending copy function.

                      The pending function is reset to _noop before it is called, so it
                      runs at most once.
                      """
                      loader = self._loadfunc
                      if loader is not _noop:
                          self._loadfunc = _noop
                          loader(self)
                          return
                      copier = self._copyfunc
                      if copier is not _noop:
                          self._copyfunc = _noop
                          copier(self)
                  def setflag(self, f, flags):
                      """Set the flags (symlink, executable) for path f."""
                      self._load()
                      topdir, rest = _splittopdir(f)
                      if not topdir:
                          self._flags[f] = flags
                      else:
                          try:
                              subtree = self._dirs[topdir]
                          except KeyError:
                              # create the missing subtree on the way down
                              subtree = treemanifest(self._subpath(topdir))
                              self._dirs[topdir] = subtree
                          subtree.setflag(rest, flags)
                      self._dirty = True
                  def copy(self):
                      """Return a copy of this tree manifest.

                      When this instance is already loaded the contents are copied right
                      away; otherwise the copying is deferred through the new instance's
                      _copyfunc.
                      """
                      clone = treemanifest(self._dir)
                      clone._node = self._node
                      clone._dirty = self._dirty
                      if self._copyfunc is not _noop:
                          # this instance is itself a pending copy: share its source
                          clone._copyfunc = self._copyfunc
                          return clone
                      def _fill(target):
                          self._load()
                          for name in self._dirs:
                              target._dirs[name] = self._dirs[name].copy()
                          target._files = dict.copy(self._files)
                          target._flags = dict.copy(self._flags)
                      if self._loadfunc is not _noop:
                          # not loaded yet: postpone the copy until it is needed
                          clone._copyfunc = _fill
                      else:
                          _fill(clone)
                      return clone
                  def filesnotin(self, m2):
                      '''Return the set of files of this manifest that m2 does not have.'''
                      missing = set()
                      def _collect(t1, t2):
                          # clean trees with the same node are skipped without loading
                          if not (t1._dirty or t2._dirty) and t1._node == t2._node:
                              return
                          t1._load()
                          t2._load()
                          for name, sub1 in t1._dirs.iteritems():
                              if name not in t2._dirs:
                                  # the whole subtree is absent from the other side
                                  missing.update(sub1.iterkeys())
                              else:
                                  _collect(sub1, t2._dirs[name])
                          missing.update(t1._subpath(fn) for fn in t1._files.iterkeys()
                                         if fn not in t2._files)
                      _collect(self, m2)
                      return missing
                  @propertycache
                  def _alldirs(self):
                      # util.dirs object built from this manifest
                      return util.dirs(self)
                  def dirs(self):
                      """Return the util.dirs object held in the _alldirs property."""
                      return self._alldirs
                  def hasdir(self, dir):
                      """Return whether the directory dir exists in this tree."""
                      self._load()
                      topdir, subdir = _splittopdir(dir)
                      if not topdir:
                          # last path component: subtree keys carry a trailing '/'
                          return (dir + '/') in self._dirs
                      if topdir not in self._dirs:
                          return False
                      return self._dirs[topdir].hasdir(subdir)
                  def walk(self, match):
                      '''Generate the names of the files accepted by match.

                      Equivalent to manifest.matches(match).iterkeys(), but without creating
                      an entirely new manifest.

                      Files listed by the matcher that are neither found nor directories
                      of this manifest are reported through match.bad().
                      '''
                      if match.always():
                          for path in self:
                              yield path
                          return
                      pending = set(match.files())
                      for path in self._walk(match):
                          # specified pattern is the exact name
                          pending.discard(path)
                          yield path
                      # for dirstate.walk, files=['.'] means "walk the whole tree".
                      # follow that here, too
                      pending.discard('.')
                      for path in sorted(pending):
                          if self.hasdir(path):
                              continue
                          match.bad(path, None)
                  def _walk(self, match):
                      '''Recursive helper of walk(): yield the matching file names.'''
                      visitable = match.visitdir(self._dir[:-1] or '.')
                      if not visitable:
                          return
                      # yield this dir's files and walk its submanifests
                      self._load()
                      names = self._dirs.keys() + self._files.keys()
                      names.sort()
                      for name in names:
                          if name not in self._files:
                              for path in self._dirs[name]._walk(match):
                                  yield path
                              continue
                          fullpath = self._subpath(name)
                          if match(fullpath):
                              yield fullpath
                  def matches(self, match):
                      '''generate a new manifest filtered by the match argument

                      A matcher whose always() is true yields a plain copy; any other
                      matcher is handled by _matches().
                      '''
                      if match.always():
                          return self.copy()
                      return self._matches(match)
                  def _matches(self, match):
                      '''Recursive helper of matches(): build the filtered manifest.

                      The result is marked dirty when it ends up non-empty.
                      '''
                      visit = match.visitdir(self._dir[:-1] or '.')
                      if visit == 'all':
                          # everything below this directory matches
                          return self.copy()
                      filtered = treemanifest(self._dir)
                      if not visit:
                          return filtered
                      self._load()
                      for name, node in self._files.iteritems():
                          if not match(self._subpath(name)):
                              continue
                          filtered._files[name] = node
                          if name in self._flags:
                              filtered._flags[name] = self._flags[name]
                      for name, subtree in self._dirs.iteritems():
                          submatch = subtree._matches(match)
                          # empty subtrees are left out of the result
                          if not submatch._isempty():
                              filtered._dirs[name] = submatch
                      if not filtered._isempty():
                          filtered._dirty = True
                      return filtered
                  def diff(self, m2, clean=False):
                      '''Compare this manifest with m2 and return the differences.

                      Args:
                        m2: the manifest to which this manifest should be compared.
                        clean: if true, include files unchanged between these manifests
                               with a None value in the returned dictionary.

                      The result is a dict keyed by file name.  Each value has the form
                      ((n1,fl1),(n2,fl2)), where n1/n2 is the nodeid in the current/other
                      manifest and fl1/fl2 is the flag in the current/other manifest.
                      Where the file does not exist, the nodeid is None and the flags are
                      the empty string.
                      '''
                      changes = {}
                      # stands in for a directory that is missing on one side
                      emptytree = treemanifest()
                      def _compare(t1, t2):
                          # clean trees with the same node are skipped without loading
                          if not (t1._dirty or t2._dirty) and t1._node == t2._node:
                              return
                          t1._load()
                          t2._load()
                          for name, sub1 in t1._dirs.iteritems():
                              _compare(sub1, t2._dirs.get(name, emptytree))
                          for name, sub2 in t2._dirs.iteritems():
                              if name not in t1._dirs:
                                  _compare(emptytree, sub2)
                          for fn, n1 in t1._files.iteritems():
                              fl1 = t1._flags.get(fn, '')
                              n2 = t2._files.get(fn, None)
                              fl2 = t2._flags.get(fn, '')
                              if n1 != n2 or fl1 != fl2:
                                  changes[t1._subpath(fn)] = ((n1, fl1), (n2, fl2))
                              elif clean:
                                  changes[t1._subpath(fn)] = None
                          # files that exist only on the m2 side
                          for fn, n2 in t2._files.iteritems():
                              if fn in t1._files:
                                  continue
                              fl2 = t2._flags.get(fn, '')
                              changes[t2._subpath(fn)] = ((None, ''), (n2, fl2))
                      _compare(self, m2)
                      return changes
                  def unmodifiedsince(self, m2):
                      '''Report whether this manifest and m2 are both clean and share
                      the same node id.
                      '''
                      # A dirty flag on either side rules out "unmodified" outright.
                      if self._dirty or m2._dirty:
                          return False
                      return self._node == m2._node
                  def parse(self, text, readsubtree):
                      '''Populate this manifest from the entries produced by
                      _parse(text).
                      Entries flagged 't' are subdirectories and are resolved through
                      readsubtree(path, node); everything else is stored as a file.
                      '''
                      for path, node, flag in _parse(text):
                          if flag == 't':
                              # Directory keys carry a trailing slash.
                              dirname = path + '/'
                              self._dirs[dirname] = readsubtree(
                                  self._subpath(dirname), node)
                              continue
                          if '/' in path:
                              # Flat-manifest entry: go through __setitem__ and
                              # setflag instead of touching _files/_flags, so the
                              # path can land in a subdirectory and the manifest is
                              # marked dirty (compared to nullid).
                              self[path] = node
                              if flag:
                                  self.setflag(path, flag)
                              continue
                          # Direct assignment to _files/_flags does not mark the
                          # manifest dirty, and should be a little faster.
                          self._files[path] = node
                          if flag:
                              self._flags[path] = flag
                  def text(self, usemanifestv2=False):
                      """Return the complete contents of this manifest as a bytestring.
                      The manifest is loaded first; its entries are then serialized by
                      _text(), which also receives the usemanifestv2 flag.
                      """
                      self._load()
                      entries = self.iterentries()
                      return _text(entries, usemanifestv2)
                  def dirtext(self, usemanifestv2=False):
                      """Return the contents of just this directory as a bytestring.
                      Subdirectories appear as entries flagged 't' carrying the
                      submanifest's current node id, so any submanifests must have been
                      written beforehand for those node ids to be correct.
                      """
                      self._load()
                      getflag = self.flags
                      # Directory keys end with '/'; strip it for the stored name.
                      entries = [(d[:-1], self._dirs[d]._node, 't')
                                 for d in self._dirs]
                      entries.extend((f, self._files[f], getflag(f))
                                     for f in self._files)
                      entries.sort()
                      return _text(entries, usemanifestv2)
                  def read(self, gettext, readsubtree):
                      '''Arrange for this manifest to be parsed lazily.
                      Nothing is read here: a loader is stored in _loadfunc which, when
                      invoked with a manifest, parses gettext() into it (resolving
                      subtrees through readsubtree) and then marks it as not dirty.
                      '''
                      def _deferredparse(tree):
                          tree.parse(gettext(), readsubtree)
                          tree._dirty = False
                      self._loadfunc = _deferredparse
                  def writesubtrees(self, m1, m2, writesubtree):
                      '''Invoke writesubtree(subm, subp1, subp2) for every subdirectory
                      of this manifest.
                      subp1/subp2 are the node ids of the same subdirectory in m1 and
                      m2; a subdirectory missing from a parent contributes the node id
                      of an empty treemanifest. If the first parent id is nullid the
                      two ids are swapped before the call.
                      '''
                      self._load() # for consistency; should never have any effect here
                      for parent in (m1, m2):
                          parent._load()
                      blank = treemanifest()
                      for name, child in self._dirs.iteritems():
                          first = m1._dirs.get(name, blank)._node
                          second = m2._dirs.get(name, blank)._node
                          if first == revlog.nullid:
                              first, second = second, first
                          writesubtree(child, first, second)
              class manifestrevlog(revlog.revlog):
                  '''A revlog that stores manifest texts. This is responsible for caching the
                  full-text manifest contents.
                  '''
                  def __init__(self, opener, dir='', dirlogcache=None):
                      '''Open the manifest revlog for `dir` ('' is the root manifest).
                      Cache size, tree-manifest storage and manifest v2 are read from
                      opener.options when that attribute exists. `dirlogcache` is the
                      shared directory-log cache and is only used when `dir` is set.
                      '''
                      # During normal operations, we expect to deal with not more than four
                      # revs at a time (such as during commit --amend). When rebasing large
                      # stacks of commits, the number can go up, hence the config knob below.
                      cachesize = 4
                      usetreemanifest = False
                      usemanifestv2 = False
                      opts = getattr(opener, 'options', None)
                      if opts is not None:
                          cachesize = opts.get('manifestcachesize', cachesize)
                          usetreemanifest = opts.get('treemanifest', usetreemanifest)
                          usemanifestv2 = opts.get('manifestv2', usemanifestv2)
                      self._treeondisk = usetreemanifest
                      self._usemanifestv2 = usemanifestv2
                      self._fulltextcache = util.lrucachedict(cachesize)
                      indexfile = "00manifest.i"
                      if dir:
                          # Per-directory revlogs only exist for tree manifests and
                          # are stored under "meta/<dir>/".
                          assert self._treeondisk, 'opts is %r' % opts
                          if not dir.endswith('/'):
                              dir = dir + '/'
                          indexfile = "meta/" + dir + "00manifest.i"
                      self._dir = dir
                      # The dirlogcache is kept on the root manifest log
                      if dir:
                          self._dirlogcache = dirlogcache
                      else:
                          self._dirlogcache = {'': self}
                      super(manifestrevlog, self).__init__(opener, indexfile,
                                                           checkambig=bool(dir))
                  @property
                  def fulltextcache(self):
                      '''The LRU cache of full manifest texts, keyed by node.'''
                      return self._fulltextcache
                  def clearcaches(self):
                      '''Clear the base revlog caches and the full-text cache, and reset
                      the directory-log cache so that it only maps '' to this revlog.
                      '''
                      super(manifestrevlog, self).clearcaches()
                      self._fulltextcache.clear()
                      self._dirlogcache = {'': self}
                  def dirlog(self, dir):
                      '''Return the manifestrevlog for `dir`, creating it and storing it
                      in the directory-log cache on first request.
                      '''
                      if dir:
                          assert self._treeondisk
                      if dir not in self._dirlogcache:
                          self._dirlogcache[dir] = manifestrevlog(self.opener, dir,
                                                                  self._dirlogcache)
                      return self._dirlogcache[dir]
                  def add(self, m, transaction, link, p1, p2, added, removed, readtree=None):
                      '''Store manifest `m` as a new revision and return its node.
                      `added` and `removed` are the changed file lists used to build a
                      delta against p1 on the fast path. `readtree(dir, node)` is
                      required when tree manifests are stored on disk.
                      '''
                      if (p1 in self.fulltextcache and util.safehasattr(m, 'fastdelta')
                          and not self._usemanifestv2):
                          # If our first parent is in the manifest cache, we can
                          # compute a delta here using properties we know about the
                          # manifest up-front, which may save time later for the
                          # revlog layer.
                          _checkforbidden(added)
                          # combine the changed lists into one sorted iterator
                          work = heapq.merge([(x, False) for x in added],
                                             [(x, True) for x in removed])
                          arraytext, deltatext = m.fastdelta(self.fulltextcache[p1], work)
                          cachedelta = self.rev(p1), deltatext
                          text = util.buffer(arraytext)
                          n = self.addrevision(text, transaction, link, p1, p2, cachedelta)
                      else:
                          # The first parent manifest isn't already loaded, so we'll
                          # just encode a fulltext of the manifest and pass that
                          # through to the revlog layer, and let it handle the delta
                          # process.
                          if self._treeondisk:
                              assert readtree, "readtree must be set for treemanifest writes"
                              m1 = readtree(self._dir, p1)
                              m2 = readtree(self._dir, p2)
                              n = self._addtree(m, transaction, link, m1, m2, readtree)
                              # Tree writes produce no single full text to cache.
                              arraytext = None
                          else:
                              text = m.text(self._usemanifestv2)
                              n = self.addrevision(text, transaction, link, p1, p2)
                              arraytext = array.array('c', text)
                      if arraytext is not None:
                          self.fulltextcache[n] = arraytext
                      return n
                  def _addtree(self, m, transaction, link, m1, m2, readtree):
                      '''Write tree manifest `m` (with parent manifests m1 and m2) and
                      return the node it ends up with. Subtrees are written first
                      through their own directory logs.
                      '''
                      # If the manifest is unchanged compared to one parent,
                      # don't write a new revision
                      if m.unmodifiedsince(m1) or m.unmodifiedsince(m2):
                          return m.node()
                      def writesubtree(subm, subp1, subp2):
                          # Each subdirectory is added to the revlog of its own dir.
                          sublog = self.dirlog(subm.dir())
                          sublog.add(subm, transaction, link, subp1, subp2, None, None,
                                     readtree=readtree)
                      m.writesubtrees(m1, m2, writesubtree)
                      text = m.dirtext(self._usemanifestv2)
                      # Double-check whether contents are unchanged to one parent
                      if text == m1.dirtext(self._usemanifestv2):
                          n = m1.node()
                      elif text == m2.dirtext(self._usemanifestv2):
                          n = m2.node()
                      else:
                          n = self.addrevision(text, transaction, link, m1.node(), m2.node())
                      # Save nodeid so parent manifest can calculate its nodeid
                      m.setnode(n)
                      return n
              class manifestlog(object):
                  """A collection class representing the collection of manifest snapshots
                  referenced by commits in the repository.
                  In this situation, 'manifest' refers to the abstract concept of a snapshot
                  of the list of files in the given commit. Consumers of the output of this
                  class do not care about the implementation details of the actual manifests
                  they receive (i.e. tree or flat or lazily loaded, etc)."""
                  def __init__(self, opener, repo):
                      """Build the manifest log for `repo`, reading the 'treemanifest'
                      setting from opener.options when that attribute exists.
                      """
                      self._repo = repo
                      usetreemanifest = False
                      opts = getattr(opener, 'options', None)
                      if opts is not None:
                          usetreemanifest = opts.get('treemanifest', usetreemanifest)
                      self._treeinmem = usetreemanifest
                      self._oldmanifest = repo._constructmanifest()
                      self._revlog = self._oldmanifest
                      # A cache of the manifestctx or treemanifestctx for each directory
                      self._dirmancache = {}
                      # We'll separate this into its own cache once oldmanifest is no longer
                      # used
                      self._mancache = self._oldmanifest._mancache
                      self._dirmancache[''] = self._mancache
                      # A future patch makes this use the same config value as the existing
                      # mancache
                      self.cachesize = 4
                  def __getitem__(self, node):
                      """Retrieves the manifest instance for the given node. Throws a
                      LookupError if not found.
                      """
                      return self.get('', node)
                  def get(self, dir, node):
                      """Retrieves the manifest instance for the given node in directory
                      `dir` ('' is the root manifest). Throws a LookupError if the node
                      is not in the corresponding revlog, and error.Abort if a
                      directory is requested while manifests are not stored as trees.
                      """
                      if node in self._dirmancache.get(dir, ()):
                          cachemf = self._dirmancache[dir][node]
                          # The old manifest may put non-ctx manifests in the cache, so
                          # skip those since they don't implement the full api.
                          if (isinstance(cachemf, manifestctx) or
                              isinstance(cachemf, treemanifestctx)):
                              return cachemf
                      if dir:
                          if self._revlog._treeondisk:
                              dirlog = self._revlog.dirlog(dir)
                              if node not in dirlog.nodemap:
                                  raise LookupError(node, dirlog.indexfile,
                                                    _('no node'))
                              m = treemanifestctx(self._repo, dir, node)
                          else:
                              raise error.Abort(
                                      _("cannot ask for manifest directory '%s' in a flat "
                                        "manifest") % dir)
                      else:
                          if node not in self._revlog.nodemap:
                              raise LookupError(node, self._revlog.indexfile,
                                                _('no node'))
                          if self._treeinmem:
                              m = treemanifestctx(self._repo, '', node)
                          else:
                              m = manifestctx(self._repo, node)
                      # The null revision is never stored in the per-directory cache.
                      if node != revlog.nullid:
                          mancache = self._dirmancache.get(dir)
                          if not mancache:
                              mancache = util.lrucachedict(self.cachesize)
                              self._dirmancache[dir] = mancache
                          mancache[node] = m
                      return m
+                 def clearcaches(self):
+                     self._dirmancache.clear()
+                     self._revlog.clearcaches()
              class memmanifestctx(object):
                  """An in-memory flat manifest that has not been written to the
                  manifest revlog yet.
                  """
                  def __init__(self, repo):
                      self._repo = repo
                      self._manifestdict = manifestdict()
                  def _revlog(self):
                      """Return the revlog held by the repo's manifestlog."""
                      mfl = self._repo.manifestlog
                      return mfl._revlog
                  def new(self):
                      """Return a fresh, empty memmanifestctx for the same repo."""
                      return memmanifestctx(self._repo)
                  def copy(self):
                      """Return a new memmanifestctx holding a copy of the contents."""
                      duplicate = memmanifestctx(self._repo)
                      duplicate._manifestdict = self.read().copy()
                      return duplicate
                  def read(self):
                      """Return the underlying manifestdict."""
                      return self._manifestdict
                  def write(self, transaction, link, p1, p2, added, removed):
                      """Add the contents to the manifest revlog and return whatever
                      the revlog's add() returns.
                      """
                      rl = self._revlog()
                      return rl.add(self._manifestdict, transaction, link, p1, p2,
                                    added, removed)
              class manifestctx(object):
                  """A class representing a single revision of a manifest, including its
                  contents, its parent revs, and its linkrev.
                  """
                  def __init__(self, repo, node):
                      self._repo = repo
                      # Parsed manifest contents; stays None until read() fills it in.
                      self._data = None
                      self._node = node
                      # TODO: We eventually want p1, p2, and linkrev exposed on this class,
                      # but let's add it later when something needs it and we can load it
                      # lazily.
                      #self.p1, self.p2 = revlog.parents(node)
                      #rev = revlog.rev(node)
                      #self.linkrev = revlog.linkrev(rev)
                  def _revlog(self):
                      """Return the revlog held by the repo's manifestlog."""
                      return self._repo.manifestlog._revlog
                  def node(self):
                      """Return the node this context was created for."""
                      return self._node
                  def new(self):
                      """Return a fresh, empty memmanifestctx for the same repo."""
                      return memmanifestctx(self._repo)
                  def copy(self):
                      """Return a memmanifestctx holding a copy of this manifest."""
                      memmf = memmanifestctx(self._repo)
                      memmf._manifestdict = self.read().copy()
                      return memmf
                  def read(self):
                      """Return the manifestdict for this node, parsing it on first use.
                      The null node yields an empty manifestdict. Any other node is
                      read from the revlog, and its text is also stored in the revlog's
                      full-text cache.
                      """
                      # Compare against None instead of relying on truthiness, so that
                      # a parsed manifest which evaluates as false (e.g. an empty one)
                      # still counts as loaded and is not rebuilt on every call.
                      if self._data is None:
                          if self._node == revlog.nullid:
                              self._data = manifestdict()
                          else:
                              rl = self._revlog()
                              text = rl.revision(self._node)
                              arraytext = array.array('c', text)
                              rl._fulltextcache[self._node] = arraytext
                              self._data = manifestdict(text)
                      return self._data
                  def readfast(self, shallow=False):
                      '''Calls either readdelta or read, based on which would be less work.
                      readdelta is called if the delta is against the p1, and therefore can be
                      read quickly.
                      If `shallow` is True, nothing changes since this is a flat manifest.
                      '''
                      rl = self._revlog()
                      r = rl.rev(self._node)
                      deltaparent = rl.deltaparent(r)
                      if deltaparent != revlog.nullrev and deltaparent in rl.parentrevs(r):
                          return self.readdelta()
                      return self.read()
                  def readdelta(self, shallow=False):
                      '''Returns a manifest containing just the entries that are present
                      in this manifest, but not in its p1 manifest. This is efficient to read
                      if the revlog delta is already p1.
                      Changing the value of `shallow` has no effect on flat manifests.
                      Note that the comparison is made against the revlog's delta
                      parent of this revision.
                      '''
                      # Named rl (not revlog) so the revlog module is not shadowed.
                      rl = self._revlog()
                      if rl._usemanifestv2:
                          # Need to perform a slow delta
                          r0 = rl.deltaparent(rl.rev(self._node))
                          m0 = manifestctx(self._repo, rl.node(r0)).read()
                          m1 = self.read()
                          md = manifestdict()
                          for f, ((n0, fl0), (n1, fl1)) in m0.diff(m1).iteritems():
                              # Entries without a node on this side are dropped.
                              if n1:
                                  md[f] = n1
                                  if fl1:
                                      md.setflag(f, fl1)
                          return md
                      r = rl.rev(self._node)
                      d = mdiff.patchtext(rl.revdiff(rl.deltaparent(r), r))
                      return manifestdict(d)
                  def find(self, key):
                      """Look `key` up in the parsed manifest via its find() method."""
                      return self.read().find(key)
              class memtreemanifestctx(object):
                  """An in-memory tree manifest for one directory that has not been
                  written to the manifest revlog yet.
                  """
                  def __init__(self, repo, dir=''):
                      self._repo = repo
                      self._dir = dir
                      self._treemanifest = treemanifest()
                  def _revlog(self):
                      """Return the revlog held by the repo's manifestlog."""
                      mfl = self._repo.manifestlog
                      return mfl._revlog
                  def new(self, dir=''):
                      """Return a fresh, empty memtreemanifestctx for `dir`."""
                      return memtreemanifestctx(self._repo, dir=dir)
                  def copy(self):
                      """Return a new context for the same directory holding a copy of
                      the tree.
                      """
                      duplicate = memtreemanifestctx(self._repo, dir=self._dir)
                      duplicate._treemanifest = self._treemanifest.copy()
                      return duplicate
                  def read(self):
                      """Return the underlying treemanifest."""
                      return self._treemanifest
                  def write(self, transaction, link, p1, p2, added, removed):
                      """Add the tree to the manifest revlog and return whatever the
                      revlog's add() returns. Parent trees are looked up through the
                      repo's manifestlog.
                      """
                      def readtree(dir, node):
                          ctx = self._repo.manifestlog.get(dir, node)
                          return ctx.read()
                      rl = self._revlog()
                      return rl.add(self._treemanifest, transaction, link, p1, p2,
                                    added, removed, readtree=readtree)
              class treemanifestctx(object):
                  """A single revision of the manifest of one directory, exposed as a
                  treemanifest. The contents are loaded on the first read() and kept
                  on the instance afterwards.
                  """
                  def __init__(self, repo, dir, node):
                      self._repo = repo
                      self._dir = dir
                      # Parsed manifest contents; stays None until read() fills it in.
                      self._data = None
                      self._node = node
                      # TODO: Load p1/p2/linkrev lazily. They need to be lazily loaded so that
                      # we can instantiate treemanifestctx objects for directories we don't
                      # have on disk.
                      #self.p1, self.p2 = revlog.parents(node)
                      #rev = revlog.rev(node)
                      #self.linkrev = revlog.linkrev(rev)
                  def _revlog(self):
                      """Return the directory revlog for this context's directory."""
                      return self._repo.manifestlog._revlog.dirlog(self._dir)
                  def read(self):
                      """Return the treemanifest for this node, building it on first use.
                      The null node yields an empty treemanifest. When trees are stored
                      on disk the manifest is set up to load lazily; otherwise the flat
                      text is parsed and also stored in the revlog's full-text cache.
                      """
                      # Compare against None instead of relying on truthiness, so that
                      # a manifest which evaluates as false (e.g. an empty one) still
                      # counts as loaded, and so that the check itself never has to
                      # inspect the (possibly lazily loaded) manifest.
                      if self._data is None:
                          rl = self._revlog()
                          if self._node == revlog.nullid:
                              self._data = treemanifest()
                          elif rl._treeondisk:
                              m = treemanifest(dir=self._dir)
                              def gettext():
                                  return rl.revision(self._node)
                              def readsubtree(dir, subm):
                                  return treemanifestctx(self._repo, dir, subm).read()
                              m.read(gettext, readsubtree)
                              m.setnode(self._node)
                              self._data = m
                          else:
                              text = rl.revision(self._node)
                              arraytext = array.array('c', text)
                              rl.fulltextcache[self._node] = arraytext
                              self._data = treemanifest(dir=self._dir, text=text)
                      return self._data
                  def node(self):
                      """Return the node this context was created for."""
                      return self._node
                  def new(self, dir=''):
                      """Return a fresh, empty memtreemanifestctx for `dir`."""
                      return memtreemanifestctx(self._repo, dir=dir)
                  def copy(self):
                      """Return a memtreemanifestctx holding a copy of this manifest."""
                      memmf = memtreemanifestctx(self._repo, dir=self._dir)
                      memmf._treemanifest = self.read().copy()
                      return memmf
                  def readdelta(self, shallow=False):
                      '''Returns a manifest containing just the entries that are present
                      in this manifest, but not in its p1 manifest. This is efficient to read
                      if the revlog delta is already p1.
                      If `shallow` is True, this will read the delta for this directory,
                      without recursively reading subdirectory manifests. Instead, any
                      subdirectory entry will be reported as it appears in the manifest, i.e.
                      the subdirectory will be reported among files and distinguished only by
                      its 't' flag.
                      '''
                      # Named rl (not revlog) so the revlog module is not shadowed.
                      rl = self._revlog()
                      if shallow and not rl._usemanifestv2:
                          r = rl.rev(self._node)
                          d = mdiff.patchtext(rl.revdiff(rl.deltaparent(r), r))
                          return manifestdict(d)
                      else:
                          # Need to perform a slow delta
                          r0 = rl.deltaparent(rl.rev(self._node))
                          m0 = treemanifestctx(self._repo, self._dir, rl.node(r0)).read()
                          m1 = self.read()
                          md = treemanifest(dir=self._dir)
                          for f, ((n0, fl0), (n1, fl1)) in m0.diff(m1).iteritems():
                              # Entries without a node on this side are dropped.
                              if n1:
                                  md[f] = n1
                                  if fl1:
                                      md.setflag(f, fl1)
                          return md
                  def readfast(self, shallow=False):
                      '''Calls either readdelta or read, based on which would be less work.
                      readdelta is called if the delta is against the p1, and therefore can be
                      read quickly.
                      If `shallow` is True, it only returns the entries from this manifest,
                      and not any submanifests.
                      '''
                      rl = self._revlog()
                      r = rl.rev(self._node)
                      deltaparent = rl.deltaparent(r)
                      if (deltaparent != revlog.nullrev and
                          deltaparent in rl.parentrevs(r)):
                          return self.readdelta(shallow=shallow)
                      if shallow:
                          return manifestdict(rl.revision(self._node))
                      else:
                          return self.read()
                  def find(self, key):
                      """Look `key` up in the parsed manifest via its find() method."""
                      return self.read().find(key)
              class manifest(manifestrevlog):
                  def __init__(self, opener, dir='', dirlogcache=None):
                      '''Set up the manifest cache on top of the manifest revlog.
                      'dir' and 'dirlogcache' exist for manifest.manifest's own internal
                      use. External callers should build the root manifest log with
                      manifest.manifest(opener) and reach the others through dirlog().
                      '''
                      # Four revisions is the expected working set during normal
                      # operations (such as commit --amend); rebasing large stacks of
                      # commits can need more, hence the option lookup below.
                      opts = getattr(opener, 'options', None)
                      if opts is None:
                          cachesize = 4
                          usetreemanifest = False
                      else:
                          cachesize = opts.get('manifestcachesize', 4)
                          usetreemanifest = opts.get('treemanifest', False)
                      self._mancache = util.lrucachedict(cachesize)
                      self._treeinmem = usetreemanifest
                      super(manifest, self).__init__(opener, dir=dir,
                                                     dirlogcache=dirlogcache)
                  def _newmanifest(self, data=''):
                      """Build an in-memory manifest from `data`: a treemanifest when
                      tree manifests are used in memory, a manifestdict otherwise.
                      """
                      if not self._treeinmem:
                          return manifestdict(data)
                      return treemanifest(self._dir, data)
                  def dirlog(self, dir):
                      """Override of the base revlog implementation that constructs
                      'manifest' objects rather than manifestrevlog ones. Only needed
                      until the 'manifest' type has been migrated away from."""
                      if dir:
                          assert self._treeondisk
                      cache = self._dirlogcache
                      if dir not in cache:
                          cache[dir] = manifest(self.opener, dir, cache)
                      return cache[dir]
-                 def clearcaches(self):
-                     super(manifest, self).clearcaches()
-                     self._mancache.clear()

General Comments 0

Write
Preview

You need to be logged in to leave comments. Login now

No reviewers

No TODOs yet

	Site-wide shortcuts
/	Use quick search box
g h	Goto home page
g g	Goto my private gists page
g G	Goto my public gists page
g 0-9	Goto bookmarked items from 0-9
n r	New repository page
n g	New gist page

	Repositories
g s	Goto summary page
g c	Goto changelog page
g f	Goto files page
g F	Goto files page with file search activated
g p	Goto pull requests page
g o	Goto repository settings
g O	Goto repository access permissions settings
t s	Toggle sidebar on some pages