@@ -1,576 +1,574 | |||
|
1 | 1 | # repair.py - functions for repository repair for mercurial |
|
2 | 2 | # |
|
3 | 3 | # Copyright 2005, 2006 Chris Mason <mason@suse.com> |
|
4 | 4 | # Copyright 2007 Olivia Mackall |
|
5 | 5 | # |
|
6 | 6 | # This software may be used and distributed according to the terms of the |
|
7 | 7 | # GNU General Public License version 2 or any later version. |
|
8 | 8 | |
|
9 | 9 | |
|
10 | 10 | from .i18n import _ |
|
11 | 11 | from .node import ( |
|
12 | 12 | hex, |
|
13 | 13 | short, |
|
14 | 14 | ) |
|
15 | 15 | from . import ( |
|
16 | 16 | bundle2, |
|
17 | 17 | changegroup, |
|
18 | 18 | discovery, |
|
19 | 19 | error, |
|
20 | 20 | exchange, |
|
21 | 21 | obsolete, |
|
22 | 22 | obsutil, |
|
23 | 23 | pathutil, |
|
24 | 24 | phases, |
|
25 | 25 | requirements, |
|
26 | 26 | scmutil, |
|
27 | 27 | store, |
|
28 | 28 | transaction, |
|
29 | 29 | util, |
|
30 | 30 | ) |
|
31 | 31 | from .utils import ( |
|
32 | 32 | hashutil, |
|
33 | 33 | urlutil, |
|
34 | 34 | ) |
|
35 | 35 | |
|
36 | 36 | |
|
37 | 37 | def backupbundle( |
|
38 | 38 | repo, |
|
39 | 39 | bases, |
|
40 | 40 | heads, |
|
41 | 41 | node, |
|
42 | 42 | suffix, |
|
43 | 43 | compress=True, |
|
44 | 44 | obsolescence=True, |
|
45 | 45 | tmp_backup=False, |
|
46 | 46 | ): |
|
47 | 47 | """create a bundle with the specified revisions as a backup""" |
|
48 | 48 | |
|
49 | 49 | backupdir = b"strip-backup" |
|
50 | 50 | vfs = repo.vfs |
|
51 | 51 | if not vfs.isdir(backupdir): |
|
52 | 52 | vfs.mkdir(backupdir) |
|
53 | 53 | |
|
54 | 54 | # Include a hash of all the nodes in the filename for uniqueness |
|
55 | 55 | allcommits = repo.set(b'%ln::%ln', bases, heads) |
|
56 | 56 | allhashes = sorted(c.hex() for c in allcommits) |
|
57 | 57 | totalhash = hashutil.sha1(b''.join(allhashes)).digest() |
|
58 | 58 | name = b"%s/%s-%s-%s.hg" % ( |
|
59 | 59 | backupdir, |
|
60 | 60 | short(node), |
|
61 | 61 | hex(totalhash[:4]), |
|
62 | 62 | suffix, |
|
63 | 63 | ) |
|
64 | 64 | |
|
65 | 65 | cgversion = changegroup.localversion(repo) |
|
66 | 66 | comp = None |
|
67 | 67 | if cgversion != b'01': |
|
68 | 68 | bundletype = b"HG20" |
|
69 | 69 | if compress: |
|
70 | 70 | comp = b'BZ' |
|
71 | 71 | elif compress: |
|
72 | 72 | bundletype = b"HG10BZ" |
|
73 | 73 | else: |
|
74 | 74 | bundletype = b"HG10UN" |
|
75 | 75 | |
|
76 | 76 | outgoing = discovery.outgoing(repo, missingroots=bases, ancestorsof=heads) |
|
77 | 77 | contentopts = { |
|
78 | 78 | b'cg.version': cgversion, |
|
79 | 79 | b'obsolescence': obsolescence, |
|
80 | 80 | b'phases': True, |
|
81 | 81 | } |
|
82 | 82 | return bundle2.writenewbundle( |
|
83 | 83 | repo.ui, |
|
84 | 84 | repo, |
|
85 | 85 | b'strip', |
|
86 | 86 | name, |
|
87 | 87 | bundletype, |
|
88 | 88 | outgoing, |
|
89 | 89 | contentopts, |
|
90 | 90 | vfs, |
|
91 | 91 | compression=comp, |
|
92 | 92 | allow_internal=tmp_backup, |
|
93 | 93 | ) |
|
94 | 94 | |
|
95 | 95 | |
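As an aside on the naming scheme in backupbundle() above, here is a minimal stand-alone sketch of how the `strip-backup/<short node>-<hash>-<suffix>.hg` name is put together, using hashlib instead of Mercurial's hashutil and node helpers; the node and commit hashes are fabricated stand-ins.

```python
# Sketch only: compose a backup bundle name the way backupbundle() does.
# The node and the commit hex hashes are made-up placeholders.
import hashlib

node = b'\xde\xad\xbe\xef' * 5                  # fake 20-byte binary node
allhashes = sorted([b'aa' * 20, b'bb' * 20])    # fake 40-char hex commit hashes
totalhash = hashlib.sha1(b''.join(allhashes)).digest()

name = b"%s/%s-%s-%s.hg" % (
    b"strip-backup",
    node.hex()[:12].encode('ascii'),            # roughly what short(node) yields
    totalhash[:4].hex().encode('ascii'),        # hex() of the first four digest bytes
    b"backup",
)
print(name)   # strip-backup/deadbeefdead-<8 hex chars>-backup.hg
```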
|
96 | 96 | def _collectfiles(repo, striprev): |
|
97 | 97 | """find out the filelogs affected by the strip""" |
|
98 | 98 | files = set() |
|
99 | 99 | |
|
100 | 100 | for x in range(striprev, len(repo)): |
|
101 | 101 | files.update(repo[x].files()) |
|
102 | 102 | |
|
103 | 103 | return sorted(files) |
|
104 | 104 | |
|
105 | 105 | |
|
106 | 106 | def _collectrevlog(revlog, striprev): |
|
107 | 107 | _, brokenset = revlog.getstrippoint(striprev) |
|
108 | 108 | return [revlog.linkrev(r) for r in brokenset] |
|
109 | 109 | |
|
110 | 110 | |
|
111 | 111 | def _collectbrokencsets(repo, files, striprev): |
|
112 | 112 | """return the changesets which will be broken by the truncation""" |
|
113 | 113 | s = set() |
|
114 | 114 | |
|
115 | 115 | for revlog in manifestrevlogs(repo): |
|
116 | 116 | s.update(_collectrevlog(revlog, striprev)) |
|
117 | 117 | for fname in files: |
|
118 | 118 | s.update(_collectrevlog(repo.file(fname), striprev)) |
|
119 | 119 | |
|
120 | 120 | return s |
|
121 | 121 | |
|
122 | 122 | |
|
123 | 123 | def strip(ui, repo, nodelist, backup=True, topic=b'backup'): |
|
124 | 124 | # This function requires the caller to lock the repo, but it operates |
|
125 | 125 | # within a transaction of its own, and thus requires there to be no current |
|
126 | 126 | # transaction when it is called. |
|
127 | 127 | if repo.currenttransaction() is not None: |
|
128 | 128 | raise error.ProgrammingError(b'cannot strip from inside a transaction') |
|
129 | 129 | |
|
130 | 130 | # Simple way to maintain backwards compatibility for this |
|
131 | 131 | # argument. |
|
132 | 132 | if backup in [b'none', b'strip']: |
|
133 | 133 | backup = False |
|
134 | 134 | |
|
135 | 135 | repo = repo.unfiltered() |
|
136 | 136 | repo.destroying() |
|
137 | 137 | vfs = repo.vfs |
|
138 | 138 | # load bookmark before changelog to avoid side effect from outdated |
|
139 | 139 | # changelog (see repo._refreshchangelog) |
|
140 | 140 | repo._bookmarks |
|
141 | 141 | cl = repo.changelog |
|
142 | 142 | |
|
143 | 143 | # TODO handle undo of merge sets |
|
144 | 144 | if isinstance(nodelist, bytes): |
|
145 | 145 | nodelist = [nodelist] |
|
146 | 146 | striplist = [cl.rev(node) for node in nodelist] |
|
147 | 147 | striprev = min(striplist) |
|
148 | 148 | |
|
149 | 149 | files = _collectfiles(repo, striprev) |
|
150 | 150 | saverevs = _collectbrokencsets(repo, files, striprev) |
|
151 | 151 | |
|
152 | 152 | # Some revisions with rev > striprev may not be descendants of striprev. |
|
153 | 153 | # We have to find these revisions and put them in a bundle, so that |
|
154 | 154 | # we can restore them after the truncations. |
|
155 | 155 | # To create the bundle we use repo.changegroupsubset which requires |
|
156 | 156 | # the list of heads and bases of the set of interesting revisions. |
|
157 | 157 | # (head = revision in the set that has no descendant in the set; |
|
158 | 158 | # base = revision in the set that has no ancestor in the set) |
|
159 | 159 | tostrip = set(striplist) |
|
160 | 160 | saveheads = set(saverevs) |
|
161 | 161 | for r in cl.revs(start=striprev + 1): |
|
162 | 162 | if any(p in tostrip for p in cl.parentrevs(r)): |
|
163 | 163 | tostrip.add(r) |
|
164 | 164 | |
|
165 | 165 | if r not in tostrip: |
|
166 | 166 | saverevs.add(r) |
|
167 | 167 | saveheads.difference_update(cl.parentrevs(r)) |
|
168 | 168 | saveheads.add(r) |
|
169 | 169 | saveheads = [cl.node(r) for r in saveheads] |
|
170 | 170 | |
|
171 | 171 | # compute base nodes |
|
172 | 172 | if saverevs: |
|
173 | 173 | descendants = set(cl.descendants(saverevs)) |
|
174 | 174 | saverevs.difference_update(descendants) |
|
175 | 175 | savebases = [cl.node(r) for r in saverevs] |
|
176 | 176 | stripbases = [cl.node(r) for r in tostrip] |
|
177 | 177 | |
|
178 | 178 | stripobsidx = obsmarkers = () |
|
179 | 179 | if repo.ui.configbool(b'devel', b'strip-obsmarkers'): |
|
180 | 180 | obsmarkers = obsutil.exclusivemarkers(repo, stripbases) |
|
181 | 181 | if obsmarkers: |
|
182 | 182 | stripobsidx = [ |
|
183 | 183 | i for i, m in enumerate(repo.obsstore) if m in obsmarkers |
|
184 | 184 | ] |
|
185 | 185 | |
|
186 | 186 | newbmtarget, updatebm = _bookmarkmovements(repo, tostrip) |
|
187 | 187 | |
|
188 | 188 | backupfile = None |
|
189 | 189 | node = nodelist[-1] |
|
190 | 190 | if backup: |
|
191 | 191 | backupfile = _createstripbackup(repo, stripbases, node, topic) |
|
192 | 192 | # create a changegroup for all the branches we need to keep |
|
193 | 193 | tmpbundlefile = None |
|
194 | 194 | if saveheads: |
|
195 | 195 | # do not compress temporary bundle if we remove it from disk later |
|
196 | 196 | # |
|
197 | 197 | # We do not include obsolescence, it might re-introduce prune markers |
|
198 | 198 | # we are trying to strip. This is harmless since the stripped markers |
|
199 | 199 | # are already backed up and we did not touch the markers for the |
|
200 | 200 | # saved changesets. |
|
201 | 201 | tmpbundlefile = backupbundle( |
|
202 | 202 | repo, |
|
203 | 203 | savebases, |
|
204 | 204 | saveheads, |
|
205 | 205 | node, |
|
206 | 206 | b'temp', |
|
207 | 207 | compress=False, |
|
208 | 208 | obsolescence=False, |
|
209 | 209 | tmp_backup=True, |
|
210 | 210 | ) |
|
211 | 211 | |
|
212 | 212 | with ui.uninterruptible(): |
|
213 | 213 | try: |
|
214 | 214 | with repo.transaction(b"strip") as tr: |
|
215 | 215 | # TODO this code violates the interface abstraction of the |
|
216 | 216 | # transaction and makes assumptions that file storage is |
|
217 | 217 | # using append-only files. We'll need some kind of storage |
|
218 | 218 | # API to handle stripping for us. |
|
219 | 219 | oldfiles = set(tr._offsetmap.keys()) |
|
220 | 220 | oldfiles.update(tr._newfiles) |
|
221 | 221 | |
|
222 | 222 | tr.startgroup() |
|
223 | 223 | cl.strip(striprev, tr) |
|
224 | 224 | stripmanifest(repo, striprev, tr, files) |
|
225 | 225 | |
|
226 | 226 | for fn in files: |
|
227 | 227 | repo.file(fn).strip(striprev, tr) |
|
228 | 228 | tr.endgroup() |
|
229 | 229 | |
|
230 | 230 | entries = tr.readjournal() |
|
231 | 231 | |
|
232 | 232 | for file, troffset in entries: |
|
233 | 233 | if file in oldfiles: |
|
234 | 234 | continue |
|
235 | 235 | with repo.svfs(file, b'a', checkambig=True) as fp: |
|
236 | 236 | fp.truncate(troffset) |
|
237 | 237 | if troffset == 0: |
|
238 | 238 | repo.store.markremoved(file) |
|
239 | 239 | |
|
240 | 240 | deleteobsmarkers(repo.obsstore, stripobsidx) |
|
241 | 241 | del repo.obsstore |
|
242 | 242 | repo.invalidatevolatilesets() |
|
243 | 243 | repo._phasecache.filterunknown(repo) |
|
244 | 244 | |
|
245 | 245 | if tmpbundlefile: |
|
246 | 246 | ui.note(_(b"adding branch\n")) |
|
247 | 247 | f = vfs.open(tmpbundlefile, b"rb") |
|
248 | 248 | gen = exchange.readbundle(ui, f, tmpbundlefile, vfs) |
|
249 | 249 | # silence internal shuffling chatter |
|
250 | 250 | maybe_silent = ( |
|
251 | 251 | repo.ui.silent() |
|
252 | 252 | if not repo.ui.verbose |
|
253 | 253 | else util.nullcontextmanager() |
|
254 | 254 | ) |
|
255 | 255 | with maybe_silent: |
|
256 | 256 | tmpbundleurl = b'bundle:' + vfs.join(tmpbundlefile) |
|
257 | 257 | txnname = b'strip' |
|
258 | 258 | if not isinstance(gen, bundle2.unbundle20): |
|
259 | 259 | txnname = b"strip\n%s" % urlutil.hidepassword( |
|
260 | 260 | tmpbundleurl |
|
261 | 261 | ) |
|
262 | 262 | with repo.transaction(txnname) as tr: |
|
263 | 263 | bundle2.applybundle( |
|
264 | 264 | repo, gen, tr, source=b'strip', url=tmpbundleurl |
|
265 | 265 | ) |
|
266 | 266 | f.close() |
|
267 | 267 | |
|
268 | 268 | with repo.transaction(b'repair') as tr: |
|
269 | 269 | bmchanges = [(m, repo[newbmtarget].node()) for m in updatebm] |
|
270 | 270 | repo._bookmarks.applychanges(repo, tr, bmchanges) |
|
271 | 271 | |
|
272 | 272 | transaction.cleanup_undo_files(repo.ui.warn, repo.vfs_map) |
|
273 | 273 | |
|
274 | 274 | except: # re-raises |
|
275 | 275 | if backupfile: |
|
276 | 276 | ui.warn( |
|
277 | 277 | _(b"strip failed, backup bundle stored in '%s'\n") |
|
278 | 278 | % vfs.join(backupfile) |
|
279 | 279 | ) |
|
280 | 280 | if tmpbundlefile: |
|
281 | 281 | ui.warn( |
|
282 | 282 | _(b"strip failed, unrecovered changes stored in '%s'\n") |
|
283 | 283 | % vfs.join(tmpbundlefile) |
|
284 | 284 | ) |
|
285 | 285 | ui.warn( |
|
286 | 286 | _( |
|
287 | 287 | b"(fix the problem, then recover the changesets with " |
|
288 | 288 | b"\"hg unbundle '%s'\")\n" |
|
289 | 289 | ) |
|
290 | 290 | % vfs.join(tmpbundlefile) |
|
291 | 291 | ) |
|
292 | 292 | raise |
|
293 | 293 | else: |
|
294 | 294 | if tmpbundlefile: |
|
295 | 295 | # Remove temporary bundle only if there were no exceptions |
|
296 | 296 | vfs.unlink(tmpbundlefile) |
|
297 | 297 | |
|
298 | 298 | repo.destroyed() |
|
299 | 299 | # return the backup file path (or None if 'backup' was False) so |
|
300 | 300 | # extensions can use it |
|
301 | 301 | return backupfile |
|
302 | 302 | |
|
303 | 303 | |
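The head/base vocabulary used in the comments inside strip() can be made concrete on a toy DAG. This is an illustration only, not Mercurial code, and the revision numbers are made up.

```python
# Illustration only: "head = revision in the set that has no descendant in the
# set; base = revision in the set that has no ancestor in the set", checked on
# a tiny hand-built DAG.
parents = {0: [], 1: [0], 2: [1], 3: [1], 4: [3]}

def ancestors(r):
    seen, stack = set(), list(parents[r])
    while stack:
        a = stack.pop()
        if a not in seen:
            seen.add(a)
            stack.extend(parents[a])
    return seen

s = {2, 3, 4}
heads = {r for r in s if not any(r in ancestors(c) for c in s)}
bases = {r for r in s if not ancestors(r) & s}
assert heads == {2, 4} and bases == {2, 3}
```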
|
304 | 304 | def softstrip(ui, repo, nodelist, backup=True, topic=b'backup'): |
|
305 | 305 | """perform a "soft" strip using the archived phase""" |
|
306 | 306 | tostrip = [c.node() for c in repo.set(b'sort(%ln::)', nodelist)] |
|
307 | 307 | if not tostrip: |
|
308 | 308 | return None |
|
309 | 309 | |
|
310 | 310 | backupfile = None |
|
311 | 311 | if backup: |
|
312 | 312 | node = tostrip[0] |
|
313 | 313 | backupfile = _createstripbackup(repo, tostrip, node, topic) |
|
314 | 314 | |
|
315 | 315 | newbmtarget, updatebm = _bookmarkmovements(repo, tostrip) |
|
316 | 316 | with repo.transaction(b'strip') as tr: |
|
317 | 317 | phases.retractboundary(repo, tr, phases.archived, tostrip) |
|
318 | 318 | bmchanges = [(m, repo[newbmtarget].node()) for m in updatebm] |
|
319 | 319 | repo._bookmarks.applychanges(repo, tr, bmchanges) |
|
320 | 320 | return backupfile |
|
321 | 321 | |
|
322 | 322 | |
|
323 | 323 | def _bookmarkmovements(repo, tostrip): |
|
324 | 324 | # compute necessary bookmark movement |
|
325 | 325 | bm = repo._bookmarks |
|
326 | 326 | updatebm = [] |
|
327 | 327 | for m in bm: |
|
328 | 328 | rev = repo[bm[m]].rev() |
|
329 | 329 | if rev in tostrip: |
|
330 | 330 | updatebm.append(m) |
|
331 | 331 | newbmtarget = None |
|
332 | 332 | # If we need to move bookmarks, compute bookmark |
|
333 | 333 | # targets. Otherwise we can skip doing this logic. |
|
334 | 334 | if updatebm: |
|
335 | 335 | # For a set s, max(parents(s) - s) is the same as max(heads(::s - s)), |
|
336 | 336 | # but is much faster |
|
337 | 337 | newbmtarget = repo.revs(b'max(parents(%ld) - (%ld))', tostrip, tostrip) |
|
338 | 338 | if newbmtarget: |
|
339 | 339 | newbmtarget = repo[newbmtarget.first()].node() |
|
340 | 340 | else: |
|
341 | 341 | newbmtarget = b'.' |
|
342 | 342 | return newbmtarget, updatebm |
|
343 | 343 | |
|
344 | 344 | |
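The `max(parents(%ld) - (%ld))` trick in _bookmarkmovements() leans on the identity stated in its comment. A rough stand-alone check of one instance on a toy DAG (illustration only, made-up revision numbers):

```python
# Illustration only: for a set s, max(parents(s) - s) == max(heads(::s - s)).
parents = {0: [], 1: [0], 2: [1], 3: [1], 4: [2, 3], 5: [4]}

def ancestors(revs):
    seen, stack = set(revs), list(revs)
    while stack:
        for p in parents[stack.pop()]:
            if p not in seen:
                seen.add(p)
                stack.append(p)
    return seen

def heads(revs):
    revs = set(revs)
    return {r for r in revs if not any(r in parents[c] for c in revs)}

s = {4, 5}
via_parents = max({p for r in s for p in parents[r]} - s)
via_heads = max(heads(ancestors(s) - s))
assert via_parents == via_heads == 3
```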
|
345 | 345 | def _createstripbackup(repo, stripbases, node, topic): |
|
346 | 346 | # backup the changeset we are about to strip |
|
347 | 347 | vfs = repo.vfs |
|
348 | 348 | unfi = repo.unfiltered() |
|
349 | 349 | to_node = unfi.changelog.node |
|
350 | 350 | # internal changesets are internal implementation details that should not |

351 | 351 | # leave the repository and not be exposed to the users. In addition, features |

352 | 352 | # using them are required to be resistant to strip. See test case for more |
|
353 | 353 | # details. |
|
354 | 354 | all_backup = unfi.revs( |
|
355 | 355 | b"(%ln)::(%ld) and not _internal()", |
|
356 | 356 | stripbases, |
|
357 | 357 | unfi.changelog.headrevs(), |
|
358 | 358 | ) |
|
359 | 359 | if not all_backup: |
|
360 | 360 | return None |
|
361 | 361 | |
|
362 | 362 | def to_nodes(revs): |
|
363 | 363 | return [to_node(r) for r in revs] |
|
364 | 364 | |
|
365 | 365 | bases = to_nodes(unfi.revs("roots(%ld)", all_backup)) |
|
366 | 366 | heads = to_nodes(unfi.revs("heads(%ld)", all_backup)) |
|
367 | 367 | backupfile = backupbundle(repo, bases, heads, node, topic) |
|
368 | 368 | repo.ui.status(_(b"saved backup bundle to %s\n") % vfs.join(backupfile)) |
|
369 | 369 | repo.ui.log( |
|
370 | 370 | b"backupbundle", b"saved backup bundle to %s\n", vfs.join(backupfile) |
|
371 | 371 | ) |
|
372 | 372 | return backupfile |
|
373 | 373 | |
|
374 | 374 | |
|
375 | 375 | def safestriproots(ui, repo, nodes): |
|
376 | 376 | """return list of roots of nodes where descendants are covered by nodes""" |
|
377 | 377 | torev = repo.unfiltered().changelog.rev |
|
378 | 378 | revs = {torev(n) for n in nodes} |
|
379 | 379 | # tostrip = wanted - unsafe = wanted - ancestors(orphaned) |
|
380 | 380 | # orphaned = affected - wanted |
|
381 | 381 | # affected = descendants(roots(wanted)) |
|
382 | 382 | # wanted = revs |
|
383 | 383 | revset = b'%ld - ( ::( (roots(%ld):: and not _phase(%s)) -%ld) )' |
|
384 | 384 | tostrip = set(repo.revs(revset, revs, revs, phases.internal, revs)) |
|
385 | 385 | notstrip = revs - tostrip |
|
386 | 386 | if notstrip: |
|
387 | 387 | nodestr = b', '.join(sorted(short(repo[n].node()) for n in notstrip)) |
|
388 | 388 | ui.warn( |
|
389 | 389 | _(b'warning: orphaned descendants detected, not stripping %s\n') |
|
390 | 390 | % nodestr |
|
391 | 391 | ) |
|
392 | 392 | return [c.node() for c in repo.set(b'roots(%ld)', tostrip)] |
|
393 | 393 | |
|
394 | 394 | |
|
395 | 395 | class stripcallback: |
|
396 | 396 | """used as a transaction postclose callback""" |
|
397 | 397 | |
|
398 | 398 | def __init__(self, ui, repo, backup, topic): |
|
399 | 399 | self.ui = ui |
|
400 | 400 | self.repo = repo |
|
401 | 401 | self.backup = backup |
|
402 | 402 | self.topic = topic or b'backup' |
|
403 | 403 | self.nodelist = [] |
|
404 | 404 | |
|
405 | 405 | def addnodes(self, nodes): |
|
406 | 406 | self.nodelist.extend(nodes) |
|
407 | 407 | |
|
408 | 408 | def __call__(self, tr): |
|
409 | 409 | roots = safestriproots(self.ui, self.repo, self.nodelist) |
|
410 | 410 | if roots: |
|
411 | 411 | strip(self.ui, self.repo, roots, self.backup, self.topic) |
|
412 | 412 | |
|
413 | 413 | |
|
414 | 414 | def delayedstrip(ui, repo, nodelist, topic=None, backup=True): |
|
415 | 415 | """like strip, but works inside a transaction and won't strip irrelevant revs |
|
416 | 416 | |
|
417 | 417 | nodelist must explicitly contain all descendants. Otherwise a warning will |
|
418 | 418 | be printed that some nodes are not stripped. |
|
419 | 419 | |
|
420 | 420 | Will do a backup if `backup` is True. The last non-None "topic" will be |
|
421 | 421 | used as the backup topic name. The default backup topic name is "backup". |
|
422 | 422 | """ |
|
423 | 423 | tr = repo.currenttransaction() |
|
424 | 424 | if not tr: |
|
425 | 425 | nodes = safestriproots(ui, repo, nodelist) |
|
426 | 426 | return strip(ui, repo, nodes, backup=backup, topic=topic) |
|
427 | 427 | # transaction postclose callbacks are called in alphabetical order. |
|
428 | 428 | # use '\xff' as prefix so we are likely to be called last. |
|
429 | 429 | callback = tr.getpostclose(b'\xffstrip') |
|
430 | 430 | if callback is None: |
|
431 | 431 | callback = stripcallback(ui, repo, backup=backup, topic=topic) |
|
432 | 432 | tr.addpostclose(b'\xffstrip', callback) |
|
433 | 433 | if topic: |
|
434 | 434 | callback.topic = topic |
|
435 | 435 | callback.addnodes(nodelist) |
|
436 | 436 | |
|
437 | 437 | |
|
438 | 438 | def stripmanifest(repo, striprev, tr, files): |
|
439 | 439 | for revlog in manifestrevlogs(repo): |
|
440 | 440 | revlog.strip(striprev, tr) |
|
441 | 441 | |
|
442 | 442 | |
|
443 | 443 | def manifestrevlogs(repo): |
|
444 | 444 | yield repo.manifestlog.getstorage(b'') |
|
445 | 445 | if scmutil.istreemanifest(repo): |
|
446 | 446 | # This logic is safe if treemanifest isn't enabled, but also |
|
447 | 447 | # pointless, so we skip it if treemanifest isn't enabled. |
|
448 | 448 | for entry in repo.store.datafiles(): |
|
449 | 449 | if not entry.is_revlog: |
|
450 | 450 | continue |
|
451 | if | |

452 | continue | |
|
453 | if entry.is_revlog_main: | |
|
451 | if entry.revlog_type == store.FILEFLAGS_MANIFESTLOG: | |
|
454 | 452 | yield repo.manifestlog.getstorage(entry.target_id) |
|
455 | 453 | |
|
456 | 454 | |
|
457 | 455 | def rebuildfncache(ui, repo, only_data=False): |
|
458 | 456 | """Rebuilds the fncache file from repo history. |
|
459 | 457 | |
|
460 | 458 | Missing entries will be added. Extra entries will be removed. |
|
461 | 459 | """ |
|
462 | 460 | repo = repo.unfiltered() |
|
463 | 461 | |
|
464 | 462 | if requirements.FNCACHE_REQUIREMENT not in repo.requirements: |
|
465 | 463 | ui.warn( |
|
466 | 464 | _( |
|
467 | 465 | b'(not rebuilding fncache because repository does not ' |
|
468 | 466 | b'support fncache)\n' |
|
469 | 467 | ) |
|
470 | 468 | ) |
|
471 | 469 | return |
|
472 | 470 | |
|
473 | 471 | with repo.lock(): |
|
474 | 472 | fnc = repo.store.fncache |
|
475 | 473 | fnc.ensureloaded(warn=ui.warn) |
|
476 | 474 | |
|
477 | 475 | oldentries = set(fnc.entries) |
|
478 | 476 | newentries = set() |
|
479 | 477 | seenfiles = set() |
|
480 | 478 | |
|
481 | 479 | if only_data: |
|
482 | 480 | # Trust the listing of .i from the fncache, but not the .d. This is |
|
483 | 481 | # much faster, because we only need to stat every possible .d file, |
|
484 | 482 | # instead of reading the full changelog |
|
485 | 483 | for f in fnc: |
|
486 | 484 | if f[:5] == b'data/' and f[-2:] == b'.i': |
|
487 | 485 | seenfiles.add(f[5:-2]) |
|
488 | 486 | newentries.add(f) |
|
489 | 487 | dataf = f[:-2] + b'.d' |
|
490 | 488 | if repo.store._exists(dataf): |
|
491 | 489 | newentries.add(dataf) |
|
492 | 490 | else: |
|
493 | 491 | progress = ui.makeprogress( |
|
494 | 492 | _(b'rebuilding'), unit=_(b'changesets'), total=len(repo) |
|
495 | 493 | ) |
|
496 | 494 | for rev in repo: |
|
497 | 495 | progress.update(rev) |
|
498 | 496 | |
|
499 | 497 | ctx = repo[rev] |
|
500 | 498 | for f in ctx.files(): |
|
501 | 499 | # This is to minimize I/O. |
|
502 | 500 | if f in seenfiles: |
|
503 | 501 | continue |
|
504 | 502 | seenfiles.add(f) |
|
505 | 503 | |
|
506 | 504 | i = b'data/%s.i' % f |
|
507 | 505 | d = b'data/%s.d' % f |
|
508 | 506 | |
|
509 | 507 | if repo.store._exists(i): |
|
510 | 508 | newentries.add(i) |
|
511 | 509 | if repo.store._exists(d): |
|
512 | 510 | newentries.add(d) |
|
513 | 511 | |
|
514 | 512 | progress.complete() |
|
515 | 513 | |
|
516 | 514 | if requirements.TREEMANIFEST_REQUIREMENT in repo.requirements: |
|
517 | 515 | # This logic is safe if treemanifest isn't enabled, but also |
|
518 | 516 | # pointless, so we skip it if treemanifest isn't enabled. |
|
519 | 517 | for dir in pathutil.dirs(seenfiles): |
|
520 | 518 | i = b'meta/%s/00manifest.i' % dir |
|
521 | 519 | d = b'meta/%s/00manifest.d' % dir |
|
522 | 520 | |
|
523 | 521 | if repo.store._exists(i): |
|
524 | 522 | newentries.add(i) |
|
525 | 523 | if repo.store._exists(d): |
|
526 | 524 | newentries.add(d) |
|
527 | 525 | |
|
528 | 526 | addcount = len(newentries - oldentries) |
|
529 | 527 | removecount = len(oldentries - newentries) |
|
530 | 528 | for p in sorted(oldentries - newentries): |
|
531 | 529 | ui.write(_(b'removing %s\n') % p) |
|
532 | 530 | for p in sorted(newentries - oldentries): |
|
533 | 531 | ui.write(_(b'adding %s\n') % p) |
|
534 | 532 | |
|
535 | 533 | if addcount or removecount: |
|
536 | 534 | ui.write( |
|
537 | 535 | _(b'%d items added, %d removed from fncache\n') |
|
538 | 536 | % (addcount, removecount) |
|
539 | 537 | ) |
|
540 | 538 | fnc.entries = newentries |
|
541 | 539 | fnc._dirty = True |
|
542 | 540 | |
|
543 | 541 | with repo.transaction(b'fncache') as tr: |
|
544 | 542 | fnc.write(tr) |
|
545 | 543 | else: |
|
546 | 544 | ui.write(_(b'fncache already up to date\n')) |
|
547 | 545 | |
|
548 | 546 | |
|
549 | 547 | def deleteobsmarkers(obsstore, indices): |
|
550 | 548 | """Delete some obsmarkers from obsstore and return how many were deleted |
|
551 | 549 | |
|
552 | 550 | 'indices' is a list of ints which are the indices |
|
553 | 551 | of the markers to be deleted. |
|
554 | 552 | |
|
555 | 553 | Every invocation of this function completely rewrites the obsstore file, |
|
556 | 554 | skipping the markers we want to be removed. The new temporary file is |
|
557 | 555 | created, remaining markers are written there and on .close() this file |
|
558 | 556 | gets atomically renamed to obsstore, thus guaranteeing consistency.""" |
|
559 | 557 | if not indices: |
|
560 | 558 | # we don't want to rewrite the obsstore with the same content |
|
561 | 559 | return |
|
562 | 560 | |
|
563 | 561 | left = [] |
|
564 | 562 | current = obsstore._all |
|
565 | 563 | n = 0 |
|
566 | 564 | for i, m in enumerate(current): |
|
567 | 565 | if i in indices: |
|
568 | 566 | n += 1 |
|
569 | 567 | continue |
|
570 | 568 | left.append(m) |
|
571 | 569 | |
|
572 | 570 | newobsstorefile = obsstore.svfs(b'obsstore', b'w', atomictemp=True) |
|
573 | 571 | for bytes in obsolete.encodemarkers(left, True, obsstore._version): |
|
574 | 572 | newobsstorefile.write(bytes) |
|
575 | 573 | newobsstorefile.close() |
|
576 | 574 | return n |
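As a side note on deleteobsmarkers() above: its docstring describes a filter-and-atomically-replace rewrite. Below is a minimal standard-library sketch of the same pattern; the helper name and the line-oriented file format are invented for illustration, and the real code goes through Mercurial's vfs with atomictemp=True.

```python
# Sketch only: rewrite a file without the dropped records, then swap it into
# place atomically, mirroring the approach deleteobsmarkers() takes.
import os
import tempfile

def delete_records(path, indices):
    """Drop the records at `indices` from the line-oriented file at `path`."""
    indices = set(indices)
    with open(path, 'rb') as f:
        records = f.readlines()
    kept = [rec for i, rec in enumerate(records) if i not in indices]
    fd, tmp = tempfile.mkstemp(dir=os.path.dirname(path) or '.')
    with os.fdopen(fd, 'wb') as out:
        out.writelines(kept)
    os.replace(tmp, path)   # atomic rename, like atomictemp on close
    return len(records) - len(kept)
```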
@@ -1,887 +1,885 | |||
|
1 | 1 | # censor code related to censoring revision |
|
2 | 2 | # coding: utf8 |
|
3 | 3 | # |
|
4 | 4 | # Copyright 2021 Pierre-Yves David <pierre-yves.david@octobus.net> |
|
5 | 5 | # Copyright 2015 Google, Inc <martinvonz@google.com> |
|
6 | 6 | # |
|
7 | 7 | # This software may be used and distributed according to the terms of the |
|
8 | 8 | # GNU General Public License version 2 or any later version. |
|
9 | 9 | |
|
10 | 10 | import binascii |
|
11 | 11 | import contextlib |
|
12 | 12 | import os |
|
13 | 13 | import struct |
|
14 | 14 | |
|
15 | 15 | from ..node import ( |
|
16 | 16 | nullrev, |
|
17 | 17 | ) |
|
18 | 18 | from .constants import ( |
|
19 | 19 | COMP_MODE_PLAIN, |
|
20 | 20 | ENTRY_DATA_COMPRESSED_LENGTH, |
|
21 | 21 | ENTRY_DATA_COMPRESSION_MODE, |
|
22 | 22 | ENTRY_DATA_OFFSET, |
|
23 | 23 | ENTRY_DATA_UNCOMPRESSED_LENGTH, |
|
24 | 24 | ENTRY_DELTA_BASE, |
|
25 | 25 | ENTRY_LINK_REV, |
|
26 | 26 | ENTRY_NODE_ID, |
|
27 | 27 | ENTRY_PARENT_1, |
|
28 | 28 | ENTRY_PARENT_2, |
|
29 | 29 | ENTRY_SIDEDATA_COMPRESSED_LENGTH, |
|
30 | 30 | ENTRY_SIDEDATA_COMPRESSION_MODE, |
|
31 | 31 | ENTRY_SIDEDATA_OFFSET, |
|
32 | 32 | REVIDX_ISCENSORED, |
|
33 | 33 | REVLOGV0, |
|
34 | 34 | REVLOGV1, |
|
35 | 35 | ) |
|
36 | 36 | from ..i18n import _ |
|
37 | 37 | |
|
38 | 38 | from .. import ( |
|
39 | 39 | error, |
|
40 | 40 | mdiff, |
|
41 | 41 | pycompat, |
|
42 | 42 | revlogutils, |
|
43 | 43 | util, |
|
44 | 44 | ) |
|
45 | 45 | from ..utils import ( |
|
46 | 46 | storageutil, |
|
47 | 47 | ) |
|
48 | 48 | from . import ( |
|
49 | 49 | constants, |
|
50 | 50 | deltas, |
|
51 | 51 | ) |
|
52 | 52 | |
|
53 | 53 | |
|
54 | 54 | def v1_censor(rl, tr, censornode, tombstone=b''): |
|
55 | 55 | """censors a revision in a "version 1" revlog""" |
|
56 | 56 | assert rl._format_version == constants.REVLOGV1, rl._format_version |
|
57 | 57 | |
|
58 | 58 | # avoid cycle |
|
59 | 59 | from .. import revlog |
|
60 | 60 | |
|
61 | 61 | censorrev = rl.rev(censornode) |
|
62 | 62 | tombstone = storageutil.packmeta({b'censored': tombstone}, b'') |
|
63 | 63 | |
|
64 | 64 | # Rewriting the revlog in place is hard. Our strategy for censoring is |
|
65 | 65 | # to create a new revlog, copy all revisions to it, then replace the |
|
66 | 66 | # revlogs on transaction close. |
|
67 | 67 | # |
|
68 | 68 | # This is a bit dangerous. We could easily have a mismatch of state. |
|
69 | 69 | newrl = revlog.revlog( |
|
70 | 70 | rl.opener, |
|
71 | 71 | target=rl.target, |
|
72 | 72 | radix=rl.radix, |
|
73 | 73 | postfix=b'tmpcensored', |
|
74 | 74 | censorable=True, |
|
75 | 75 | ) |
|
76 | 76 | newrl._format_version = rl._format_version |
|
77 | 77 | newrl._format_flags = rl._format_flags |
|
78 | 78 | newrl._generaldelta = rl._generaldelta |
|
79 | 79 | newrl._parse_index = rl._parse_index |
|
80 | 80 | |
|
81 | 81 | for rev in rl.revs(): |
|
82 | 82 | node = rl.node(rev) |
|
83 | 83 | p1, p2 = rl.parents(node) |
|
84 | 84 | |
|
85 | 85 | if rev == censorrev: |
|
86 | 86 | newrl.addrawrevision( |
|
87 | 87 | tombstone, |
|
88 | 88 | tr, |
|
89 | 89 | rl.linkrev(censorrev), |
|
90 | 90 | p1, |
|
91 | 91 | p2, |
|
92 | 92 | censornode, |
|
93 | 93 | constants.REVIDX_ISCENSORED, |
|
94 | 94 | ) |
|
95 | 95 | |
|
96 | 96 | if newrl.deltaparent(rev) != nullrev: |
|
97 | 97 | m = _(b'censored revision stored as delta; cannot censor') |
|
98 | 98 | h = _( |
|
99 | 99 | b'censoring of revlogs is not fully implemented;' |
|
100 | 100 | b' please report this bug' |
|
101 | 101 | ) |
|
102 | 102 | raise error.Abort(m, hint=h) |
|
103 | 103 | continue |
|
104 | 104 | |
|
105 | 105 | if rl.iscensored(rev): |
|
106 | 106 | if rl.deltaparent(rev) != nullrev: |
|
107 | 107 | m = _( |
|
108 | 108 | b'cannot censor due to censored ' |
|
109 | 109 | b'revision having delta stored' |
|
110 | 110 | ) |
|
111 | 111 | raise error.Abort(m) |
|
112 | 112 | rawtext = rl._chunk(rev) |
|
113 | 113 | else: |
|
114 | 114 | rawtext = rl.rawdata(rev) |
|
115 | 115 | |
|
116 | 116 | newrl.addrawrevision( |
|
117 | 117 | rawtext, tr, rl.linkrev(rev), p1, p2, node, rl.flags(rev) |
|
118 | 118 | ) |
|
119 | 119 | |
|
120 | 120 | tr.addbackup(rl._indexfile, location=b'store') |
|
121 | 121 | if not rl._inline: |
|
122 | 122 | tr.addbackup(rl._datafile, location=b'store') |
|
123 | 123 | |
|
124 | 124 | rl.opener.rename(newrl._indexfile, rl._indexfile) |
|
125 | 125 | if not rl._inline: |
|
126 | 126 | rl.opener.rename(newrl._datafile, rl._datafile) |
|
127 | 127 | |
|
128 | 128 | rl.clearcaches() |
|
129 | 129 | rl._loadindex() |
|
130 | 130 | |
|
131 | 131 | |
|
132 | 132 | def v2_censor(revlog, tr, censornode, tombstone=b''): |
|
133 | 133 | """censors a revision in a "version 2" revlog""" |
|
134 | 134 | assert revlog._format_version != REVLOGV0, revlog._format_version |
|
135 | 135 | assert revlog._format_version != REVLOGV1, revlog._format_version |
|
136 | 136 | |
|
137 | 137 | censor_revs = {revlog.rev(censornode)} |
|
138 | 138 | _rewrite_v2(revlog, tr, censor_revs, tombstone) |
|
139 | 139 | |
|
140 | 140 | |
|
141 | 141 | def _rewrite_v2(revlog, tr, censor_revs, tombstone=b''): |
|
142 | 142 | """rewrite a revlog to censor some of its content |
|
143 | 143 | |
|
144 | 144 | General principle |
|
145 | 145 | |
|
146 | 146 | We create new revlog files (index/data/sidedata) to copy the content of |
|
147 | 147 | the existing data without the censored data. |
|
148 | 148 | |
|
149 | 149 | We need to recompute new delta for any revision that used the censored |
|
150 | 150 | revision as delta base. As the cumulative size of the new delta may be |
|
151 | 151 | large, we store them in a temporary file until they are stored in their |
|
152 | 152 | final destination. |
|
153 | 153 | |
|
154 | 154 | All data before the censored data can be blindly copied. The rest needs |
|
155 | 155 | to be copied as we go and the associated index entry needs adjustment. |
|
156 | 156 | """ |
|
157 | 157 | assert revlog._format_version != REVLOGV0, revlog._format_version |
|
158 | 158 | assert revlog._format_version != REVLOGV1, revlog._format_version |
|
159 | 159 | |
|
160 | 160 | old_index = revlog.index |
|
161 | 161 | docket = revlog._docket |
|
162 | 162 | |
|
163 | 163 | tombstone = storageutil.packmeta({b'censored': tombstone}, b'') |
|
164 | 164 | |
|
165 | 165 | first_excl_rev = min(censor_revs) |
|
166 | 166 | |
|
167 | 167 | first_excl_entry = revlog.index[first_excl_rev] |
|
168 | 168 | index_cutoff = revlog.index.entry_size * first_excl_rev |
|
169 | 169 | data_cutoff = first_excl_entry[ENTRY_DATA_OFFSET] >> 16 |
|
170 | 170 | sidedata_cutoff = revlog.sidedata_cut_off(first_excl_rev) |
|
171 | 171 | |
|
172 | 172 | with pycompat.unnamedtempfile(mode=b"w+b") as tmp_storage: |
|
173 | 173 | # rev β (new_base, data_start, data_end, compression_mode) |
|
174 | 174 | rewritten_entries = _precompute_rewritten_delta( |
|
175 | 175 | revlog, |
|
176 | 176 | old_index, |
|
177 | 177 | censor_revs, |
|
178 | 178 | tmp_storage, |
|
179 | 179 | ) |
|
180 | 180 | |
|
181 | 181 | all_files = _setup_new_files( |
|
182 | 182 | revlog, |
|
183 | 183 | index_cutoff, |
|
184 | 184 | data_cutoff, |
|
185 | 185 | sidedata_cutoff, |
|
186 | 186 | ) |
|
187 | 187 | |
|
188 | 188 | # we don't need to open the old index file since its content already |

189 | 189 | # exists in a usable form in `old_index`. |
|
190 | 190 | with all_files() as open_files: |
|
191 | 191 | ( |
|
192 | 192 | old_data_file, |
|
193 | 193 | old_sidedata_file, |
|
194 | 194 | new_index_file, |
|
195 | 195 | new_data_file, |
|
196 | 196 | new_sidedata_file, |
|
197 | 197 | ) = open_files |
|
198 | 198 | |
|
199 | 199 | # writing the censored revision |
|
200 | 200 | |
|
201 | 201 | # Writing all subsequent revisions |
|
202 | 202 | for rev in range(first_excl_rev, len(old_index)): |
|
203 | 203 | if rev in censor_revs: |
|
204 | 204 | _rewrite_censor( |
|
205 | 205 | revlog, |
|
206 | 206 | old_index, |
|
207 | 207 | open_files, |
|
208 | 208 | rev, |
|
209 | 209 | tombstone, |
|
210 | 210 | ) |
|
211 | 211 | else: |
|
212 | 212 | _rewrite_simple( |
|
213 | 213 | revlog, |
|
214 | 214 | old_index, |
|
215 | 215 | open_files, |
|
216 | 216 | rev, |
|
217 | 217 | rewritten_entries, |
|
218 | 218 | tmp_storage, |
|
219 | 219 | ) |
|
220 | 220 | docket.write(transaction=None, stripping=True) |
|
221 | 221 | |
|
222 | 222 | |
|
223 | 223 | def _precompute_rewritten_delta( |
|
224 | 224 | revlog, |
|
225 | 225 | old_index, |
|
226 | 226 | excluded_revs, |
|
227 | 227 | tmp_storage, |
|
228 | 228 | ): |
|
229 | 229 | """Compute new delta for revisions whose delta is based on a revision that |
|
230 | 230 | will not survive as is. |
|
231 | 231 | |
|
232 | 232 | Return a mapping: {rev β (new_base, data_start, data_end, compression_mode)} |
|
233 | 233 | """ |
|
234 | 234 | dc = deltas.deltacomputer(revlog) |
|
235 | 235 | rewritten_entries = {} |
|
236 | 236 | first_excl_rev = min(excluded_revs) |
|
237 | 237 | with revlog._segmentfile._open_read() as dfh: |
|
238 | 238 | for rev in range(first_excl_rev, len(old_index)): |
|
239 | 239 | if rev in excluded_revs: |
|
240 | 240 | # this revision will be preserved as is, so we don't need to |
|
241 | 241 | # consider recomputing a delta. |
|
242 | 242 | continue |
|
243 | 243 | entry = old_index[rev] |
|
244 | 244 | if entry[ENTRY_DELTA_BASE] not in excluded_revs: |
|
245 | 245 | continue |
|
246 | 246 | # This is a revision that uses the censored revision as the base |

247 | 247 | # for its delta. We need to compute a new delta for it. |
|
248 | 248 | if entry[ENTRY_DATA_UNCOMPRESSED_LENGTH] == 0: |
|
249 | 249 | # this revision is empty, we can delta against nullrev |
|
250 | 250 | rewritten_entries[rev] = (nullrev, 0, 0, COMP_MODE_PLAIN) |
|
251 | 251 | else: |
|
252 | 252 | |
|
253 | 253 | text = revlog.rawdata(rev, _df=dfh) |
|
254 | 254 | info = revlogutils.revisioninfo( |
|
255 | 255 | node=entry[ENTRY_NODE_ID], |
|
256 | 256 | p1=revlog.node(entry[ENTRY_PARENT_1]), |
|
257 | 257 | p2=revlog.node(entry[ENTRY_PARENT_2]), |
|
258 | 258 | btext=[text], |
|
259 | 259 | textlen=len(text), |
|
260 | 260 | cachedelta=None, |
|
261 | 261 | flags=entry[ENTRY_DATA_OFFSET] & 0xFFFF, |
|
262 | 262 | ) |
|
263 | 263 | d = dc.finddeltainfo( |
|
264 | 264 | info, dfh, excluded_bases=excluded_revs, target_rev=rev |
|
265 | 265 | ) |
|
266 | 266 | default_comp = revlog._docket.default_compression_header |
|
267 | 267 | comp_mode, d = deltas.delta_compression(default_comp, d) |
|
268 | 268 | # using `tell` is a bit lazy, but we are not here for speed |
|
269 | 269 | start = tmp_storage.tell() |
|
270 | 270 | tmp_storage.write(d.data[1]) |
|
271 | 271 | end = tmp_storage.tell() |
|
272 | 272 | rewritten_entries[rev] = (d.base, start, end, comp_mode) |
|
273 | 273 | return rewritten_entries |
|
274 | 274 | |
|
275 | 275 | |
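A stand-alone sketch of the temporary-storage bookkeeping used in _precompute_rewritten_delta() above: each recomputed delta is appended to one scratch file and remembered as (start, end) offsets, so only one payload needs to be in memory at a time. Payloads and revision numbers here are made up.

```python
# Sketch only: append variable-length payloads to one scratch file and index
# them by offsets, as _precompute_rewritten_delta does with its new deltas.
import tempfile

with tempfile.TemporaryFile() as scratch:
    offsets = {}
    for rev, payload in [(7, b'delta-for-rev-7'), (9, b'delta-for-rev-9')]:
        start = scratch.tell()
        scratch.write(payload)
        offsets[rev] = (start, scratch.tell())

    # later: re-read one entry without keeping everything in memory
    start, end = offsets[9]
    scratch.seek(start)
    assert scratch.read(end - start) == b'delta-for-rev-9'
```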
|
276 | 276 | def _setup_new_files( |
|
277 | 277 | revlog, |
|
278 | 278 | index_cutoff, |
|
279 | 279 | data_cutoff, |
|
280 | 280 | sidedata_cutoff, |
|
281 | 281 | ): |
|
282 | 282 | """ |
|
283 | 283 | |
|
284 | 284 | return a context manager to open all the relevant files: |
|
285 | 285 | - old_data_file, |
|
286 | 286 | - old_sidedata_file, |
|
287 | 287 | - new_index_file, |
|
288 | 288 | - new_data_file, |
|
289 | 289 | - new_sidedata_file, |
|
290 | 290 | |
|
291 | 291 | The old_index_file is not here because it is accessed through the |
|
292 | 292 | `old_index` object of the caller function. |
|
293 | 293 | """ |
|
294 | 294 | docket = revlog._docket |
|
295 | 295 | old_index_filepath = revlog.opener.join(docket.index_filepath()) |
|
296 | 296 | old_data_filepath = revlog.opener.join(docket.data_filepath()) |
|
297 | 297 | old_sidedata_filepath = revlog.opener.join(docket.sidedata_filepath()) |
|
298 | 298 | |
|
299 | 299 | new_index_filepath = revlog.opener.join(docket.new_index_file()) |
|
300 | 300 | new_data_filepath = revlog.opener.join(docket.new_data_file()) |
|
301 | 301 | new_sidedata_filepath = revlog.opener.join(docket.new_sidedata_file()) |
|
302 | 302 | |
|
303 | 303 | util.copyfile(old_index_filepath, new_index_filepath, nb_bytes=index_cutoff) |
|
304 | 304 | util.copyfile(old_data_filepath, new_data_filepath, nb_bytes=data_cutoff) |
|
305 | 305 | util.copyfile( |
|
306 | 306 | old_sidedata_filepath, |
|
307 | 307 | new_sidedata_filepath, |
|
308 | 308 | nb_bytes=sidedata_cutoff, |
|
309 | 309 | ) |
|
310 | 310 | revlog.opener.register_file(docket.index_filepath()) |
|
311 | 311 | revlog.opener.register_file(docket.data_filepath()) |
|
312 | 312 | revlog.opener.register_file(docket.sidedata_filepath()) |
|
313 | 313 | |
|
314 | 314 | docket.index_end = index_cutoff |
|
315 | 315 | docket.data_end = data_cutoff |
|
316 | 316 | docket.sidedata_end = sidedata_cutoff |
|
317 | 317 | |
|
318 | 318 | # reload the revlog internal information |
|
319 | 319 | revlog.clearcaches() |
|
320 | 320 | revlog._loadindex(docket=docket) |
|
321 | 321 | |
|
322 | 322 | @contextlib.contextmanager |
|
323 | 323 | def all_files_opener(): |
|
324 | 324 | # hide opening in a helper function to please check-code, black |

325 | 325 | # and various python versions at the same time |
|
326 | 326 | with open(old_data_filepath, 'rb') as old_data_file: |
|
327 | 327 | with open(old_sidedata_filepath, 'rb') as old_sidedata_file: |
|
328 | 328 | with open(new_index_filepath, 'r+b') as new_index_file: |
|
329 | 329 | with open(new_data_filepath, 'r+b') as new_data_file: |
|
330 | 330 | with open( |
|
331 | 331 | new_sidedata_filepath, 'r+b' |
|
332 | 332 | ) as new_sidedata_file: |
|
333 | 333 | new_index_file.seek(0, os.SEEK_END) |
|
334 | 334 | assert new_index_file.tell() == index_cutoff |
|
335 | 335 | new_data_file.seek(0, os.SEEK_END) |
|
336 | 336 | assert new_data_file.tell() == data_cutoff |
|
337 | 337 | new_sidedata_file.seek(0, os.SEEK_END) |
|
338 | 338 | assert new_sidedata_file.tell() == sidedata_cutoff |
|
339 | 339 | yield ( |
|
340 | 340 | old_data_file, |
|
341 | 341 | old_sidedata_file, |
|
342 | 342 | new_index_file, |
|
343 | 343 | new_data_file, |
|
344 | 344 | new_sidedata_file, |
|
345 | 345 | ) |
|
346 | 346 | |
|
347 | 347 | return all_files_opener |
|
348 | 348 | |
|
349 | 349 | |
|
350 | 350 | def _rewrite_simple( |
|
351 | 351 | revlog, |
|
352 | 352 | old_index, |
|
353 | 353 | all_files, |
|
354 | 354 | rev, |
|
355 | 355 | rewritten_entries, |
|
356 | 356 | tmp_storage, |
|
357 | 357 | ): |
|
358 | 358 | """append a normal revision to the index after the rewritten one(s)""" |
|
359 | 359 | ( |
|
360 | 360 | old_data_file, |
|
361 | 361 | old_sidedata_file, |
|
362 | 362 | new_index_file, |
|
363 | 363 | new_data_file, |
|
364 | 364 | new_sidedata_file, |
|
365 | 365 | ) = all_files |
|
366 | 366 | entry = old_index[rev] |
|
367 | 367 | flags = entry[ENTRY_DATA_OFFSET] & 0xFFFF |
|
368 | 368 | old_data_offset = entry[ENTRY_DATA_OFFSET] >> 16 |
|
369 | 369 | |
|
370 | 370 | if rev not in rewritten_entries: |
|
371 | 371 | old_data_file.seek(old_data_offset) |
|
372 | 372 | new_data_size = entry[ENTRY_DATA_COMPRESSED_LENGTH] |
|
373 | 373 | new_data = old_data_file.read(new_data_size) |
|
374 | 374 | data_delta_base = entry[ENTRY_DELTA_BASE] |
|
375 | 375 | d_comp_mode = entry[ENTRY_DATA_COMPRESSION_MODE] |
|
376 | 376 | else: |
|
377 | 377 | ( |
|
378 | 378 | data_delta_base, |
|
379 | 379 | start, |
|
380 | 380 | end, |
|
381 | 381 | d_comp_mode, |
|
382 | 382 | ) = rewritten_entries[rev] |
|
383 | 383 | new_data_size = end - start |
|
384 | 384 | tmp_storage.seek(start) |
|
385 | 385 | new_data = tmp_storage.read(new_data_size) |
|
386 | 386 | |
|
387 | 387 | # It might be faster to group continuous read/write operation, |
|
388 | 388 | # however, this is censor, an operation that is not focussed |
|
389 | 389 | # around stellar performance. So I have not written this |
|
390 | 390 | # optimisation yet. |
|
391 | 391 | new_data_offset = new_data_file.tell() |
|
392 | 392 | new_data_file.write(new_data) |
|
393 | 393 | |
|
394 | 394 | sidedata_size = entry[ENTRY_SIDEDATA_COMPRESSED_LENGTH] |
|
395 | 395 | new_sidedata_offset = new_sidedata_file.tell() |
|
396 | 396 | if 0 < sidedata_size: |
|
397 | 397 | old_sidedata_offset = entry[ENTRY_SIDEDATA_OFFSET] |
|
398 | 398 | old_sidedata_file.seek(old_sidedata_offset) |
|
399 | 399 | new_sidedata = old_sidedata_file.read(sidedata_size) |
|
400 | 400 | new_sidedata_file.write(new_sidedata) |
|
401 | 401 | |
|
402 | 402 | data_uncompressed_length = entry[ENTRY_DATA_UNCOMPRESSED_LENGTH] |
|
403 | 403 | sd_com_mode = entry[ENTRY_SIDEDATA_COMPRESSION_MODE] |
|
404 | 404 | assert data_delta_base <= rev, (data_delta_base, rev) |
|
405 | 405 | |
|
406 | 406 | new_entry = revlogutils.entry( |
|
407 | 407 | flags=flags, |
|
408 | 408 | data_offset=new_data_offset, |
|
409 | 409 | data_compressed_length=new_data_size, |
|
410 | 410 | data_uncompressed_length=data_uncompressed_length, |
|
411 | 411 | data_delta_base=data_delta_base, |
|
412 | 412 | link_rev=entry[ENTRY_LINK_REV], |
|
413 | 413 | parent_rev_1=entry[ENTRY_PARENT_1], |
|
414 | 414 | parent_rev_2=entry[ENTRY_PARENT_2], |
|
415 | 415 | node_id=entry[ENTRY_NODE_ID], |
|
416 | 416 | sidedata_offset=new_sidedata_offset, |
|
417 | 417 | sidedata_compressed_length=sidedata_size, |
|
418 | 418 | data_compression_mode=d_comp_mode, |
|
419 | 419 | sidedata_compression_mode=sd_com_mode, |
|
420 | 420 | ) |
|
421 | 421 | revlog.index.append(new_entry) |
|
422 | 422 | entry_bin = revlog.index.entry_binary(rev) |
|
423 | 423 | new_index_file.write(entry_bin) |
|
424 | 424 | |
|
425 | 425 | revlog._docket.index_end = new_index_file.tell() |
|
426 | 426 | revlog._docket.data_end = new_data_file.tell() |
|
427 | 427 | revlog._docket.sidedata_end = new_sidedata_file.tell() |
|
428 | 428 | |
|
429 | 429 | |
|
430 | 430 | def _rewrite_censor( |
|
431 | 431 | revlog, |
|
432 | 432 | old_index, |
|
433 | 433 | all_files, |
|
434 | 434 | rev, |
|
435 | 435 | tombstone, |
|
436 | 436 | ): |
|
437 | 437 | """rewrite and append a censored revision""" |
|
438 | 438 | ( |
|
439 | 439 | old_data_file, |
|
440 | 440 | old_sidedata_file, |
|
441 | 441 | new_index_file, |
|
442 | 442 | new_data_file, |
|
443 | 443 | new_sidedata_file, |
|
444 | 444 | ) = all_files |
|
445 | 445 | entry = old_index[rev] |
|
446 | 446 | |
|
447 | 447 | # XXX consider trying the default compression too |
|
448 | 448 | new_data_size = len(tombstone) |
|
449 | 449 | new_data_offset = new_data_file.tell() |
|
450 | 450 | new_data_file.write(tombstone) |
|
451 | 451 | |
|
452 | 452 | # we are not adding any sidedata as they might leak info about the censored version |
|
453 | 453 | |
|
454 | 454 | link_rev = entry[ENTRY_LINK_REV] |
|
455 | 455 | |
|
456 | 456 | p1 = entry[ENTRY_PARENT_1] |
|
457 | 457 | p2 = entry[ENTRY_PARENT_2] |
|
458 | 458 | |
|
459 | 459 | new_entry = revlogutils.entry( |
|
460 | 460 | flags=constants.REVIDX_ISCENSORED, |
|
461 | 461 | data_offset=new_data_offset, |
|
462 | 462 | data_compressed_length=new_data_size, |
|
463 | 463 | data_uncompressed_length=new_data_size, |
|
464 | 464 | data_delta_base=rev, |
|
465 | 465 | link_rev=link_rev, |
|
466 | 466 | parent_rev_1=p1, |
|
467 | 467 | parent_rev_2=p2, |
|
468 | 468 | node_id=entry[ENTRY_NODE_ID], |
|
469 | 469 | sidedata_offset=0, |
|
470 | 470 | sidedata_compressed_length=0, |
|
471 | 471 | data_compression_mode=COMP_MODE_PLAIN, |
|
472 | 472 | sidedata_compression_mode=COMP_MODE_PLAIN, |
|
473 | 473 | ) |
|
474 | 474 | revlog.index.append(new_entry) |
|
475 | 475 | entry_bin = revlog.index.entry_binary(rev) |
|
476 | 476 | new_index_file.write(entry_bin) |
|
477 | 477 | revlog._docket.index_end = new_index_file.tell() |
|
478 | 478 | revlog._docket.data_end = new_data_file.tell() |
|
479 | 479 | |
|
480 | 480 | |
|
481 | 481 | def _get_filename_from_filelog_index(path): |
|
482 | 482 | # Drop the extension and the `data/` prefix |
|
483 | 483 | path_part = path.rsplit(b'.', 1)[0].split(b'/', 1) |
|
484 | 484 | if len(path_part) < 2: |
|
485 | 485 | msg = _(b"cannot recognize filelog from filename: '%s'") |
|
486 | 486 | msg %= path |
|
487 | 487 | raise error.Abort(msg) |
|
488 | 488 | |
|
489 | 489 | return path_part[1] |
|
490 | 490 | |
|
491 | 491 | |
|
492 | 492 | def _filelog_from_filename(repo, path): |
|
493 | 493 | """Returns the filelog for the given `path`. Stolen from `engine.py`""" |
|
494 | 494 | |
|
495 | 495 | from .. import filelog # avoid cycle |
|
496 | 496 | |
|
497 | 497 | fl = filelog.filelog(repo.svfs, path) |
|
498 | 498 | return fl |
|
499 | 499 | |
|
500 | 500 | |
|
501 | 501 | def _write_swapped_parents(repo, rl, rev, offset, fp): |
|
502 | 502 | """Swaps p1 and p2 and overwrites the revlog entry for `rev` in `fp`""" |
|
503 | 503 | from ..pure import parsers # avoid cycle |
|
504 | 504 | |
|
505 | 505 | if repo._currentlock(repo._lockref) is None: |
|
506 | 506 | # Let's be paranoid about it |
|
507 | 507 | msg = "repo needs to be locked to rewrite parents" |
|
508 | 508 | raise error.ProgrammingError(msg) |
|
509 | 509 | |
|
510 | 510 | index_format = parsers.IndexObject.index_format |
|
511 | 511 | entry = rl.index[rev] |
|
512 | 512 | new_entry = list(entry) |
|
513 | 513 | new_entry[5], new_entry[6] = entry[6], entry[5] |
|
514 | 514 | packed = index_format.pack(*new_entry[:8]) |
|
515 | 515 | fp.seek(offset) |
|
516 | 516 | fp.write(packed) |
|
517 | 517 | |
|
518 | 518 | |
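A self-contained sketch of the seek-and-overwrite pattern used by _write_swapped_parents() above: read one fixed-size record, swap two fields, and write it back at the same offset. The three-int record layout is invented for the example; the real index entry is larger and is packed with parsers.IndexObject.index_format.

```python
# Sketch only: swap two fields of one fixed-size record in place.
# The (value, p1, p2) layout is made up for the example.
import io
import struct

record = struct.Struct('>iii')
buf = io.BytesIO()
for entry in [(10, -1, -1), (11, 0, -1), (12, 1, 0)]:
    buf.write(record.pack(*entry))

rev = 2                         # rewrite the third record
offset = rev * record.size
buf.seek(offset)
value, p1, p2 = record.unpack(buf.read(record.size))
buf.seek(offset)
buf.write(record.pack(value, p2, p1))

buf.seek(offset)
assert record.unpack(buf.read(record.size)) == (12, 0, 1)
```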
|
519 | 519 | def _reorder_filelog_parents(repo, fl, to_fix): |
|
520 | 520 | """ |
|
521 | 521 | Swaps p1 and p2 for all `to_fix` revisions of filelog `fl` and writes the |
|
522 | 522 | new version to disk, overwriting the old one with a rename. |
|
523 | 523 | """ |
|
524 | 524 | from ..pure import parsers # avoid cycle |
|
525 | 525 | |
|
526 | 526 | ui = repo.ui |
|
527 | 527 | assert len(to_fix) > 0 |
|
528 | 528 | rl = fl._revlog |
|
529 | 529 | if rl._format_version != constants.REVLOGV1: |
|
530 | 530 | msg = "expected version 1 revlog, got version '%d'" % rl._format_version |
|
531 | 531 | raise error.ProgrammingError(msg) |
|
532 | 532 | |
|
533 | 533 | index_file = rl._indexfile |
|
534 | 534 | new_file_path = index_file + b'.tmp-parents-fix' |
|
535 | 535 | repaired_msg = _(b"repaired revision %d of 'filelog %s'\n") |
|
536 | 536 | |
|
537 | 537 | with ui.uninterruptible(): |
|
538 | 538 | try: |
|
539 | 539 | util.copyfile( |
|
540 | 540 | rl.opener.join(index_file), |
|
541 | 541 | rl.opener.join(new_file_path), |
|
542 | 542 | checkambig=rl._checkambig, |
|
543 | 543 | ) |
|
544 | 544 | |
|
545 | 545 | with rl.opener(new_file_path, mode=b"r+") as fp: |
|
546 | 546 | if rl._inline: |
|
547 | 547 | index = parsers.InlinedIndexObject(fp.read()) |
|
548 | 548 | for rev in fl.revs(): |
|
549 | 549 | if rev in to_fix: |
|
550 | 550 | offset = index._calculate_index(rev) |
|
551 | 551 | _write_swapped_parents(repo, rl, rev, offset, fp) |
|
552 | 552 | ui.write(repaired_msg % (rev, index_file)) |
|
553 | 553 | else: |
|
554 | 554 | index_format = parsers.IndexObject.index_format |
|
555 | 555 | for rev in to_fix: |
|
556 | 556 | offset = rev * index_format.size |
|
557 | 557 | _write_swapped_parents(repo, rl, rev, offset, fp) |
|
558 | 558 | ui.write(repaired_msg % (rev, index_file)) |
|
559 | 559 | |
|
560 | 560 | rl.opener.rename(new_file_path, index_file) |
|
561 | 561 | rl.clearcaches() |
|
562 | 562 | rl._loadindex() |
|
563 | 563 | finally: |
|
564 | 564 | util.tryunlink(new_file_path) |
|
565 | 565 | |
|
566 | 566 | |
|
567 | 567 | def _is_revision_affected(fl, filerev, metadata_cache=None): |
|
568 | 568 | full_text = lambda: fl._revlog.rawdata(filerev) |
|
569 | 569 | parent_revs = lambda: fl._revlog.parentrevs(filerev) |
|
570 | 570 | return _is_revision_affected_inner( |
|
571 | 571 | full_text, parent_revs, filerev, metadata_cache |
|
572 | 572 | ) |
|
573 | 573 | |
|
574 | 574 | |
|
575 | 575 | def _is_revision_affected_inner( |
|
576 | 576 | full_text, |
|
577 | 577 | parents_revs, |
|
578 | 578 | filerev, |
|
579 | 579 | metadata_cache=None, |
|
580 | 580 | ): |
|
581 | 581 | """Mercurial currently (5.9rc0) gives `p1 == nullrev and p2 != nullrev` a |

582 | 582 | special meaning compared to the reverse in the context of filelog-based |
|
583 | 583 | copytracing. issue6528 exists because new code assumed that parent ordering |
|
584 | 584 | didn't matter, so this detects if the revision contains metadata (since |
|
585 | 585 | it's only used for filelog-based copytracing) and its parents are in the |
|
586 | 586 | "wrong" order.""" |
|
587 | 587 | try: |
|
588 | 588 | raw_text = full_text() |
|
589 | 589 | except error.CensoredNodeError: |
|
590 | 590 | # We don't care about censored nodes as they never carry metadata |
|
591 | 591 | return False |
|
592 | 592 | |
|
593 | 593 | # raw text can be a `memoryview`, which doesn't implement `startswith` |
|
594 | 594 | has_meta = bytes(raw_text[:2]) == b'\x01\n' |
|
595 | 595 | if metadata_cache is not None: |
|
596 | 596 | metadata_cache[filerev] = has_meta |
|
597 | 597 | if has_meta: |
|
598 | 598 | (p1, p2) = parents_revs() |
|
599 | 599 | if p1 != nullrev and p2 == nullrev: |
|
600 | 600 | return True |
|
601 | 601 | return False |
|
602 | 602 | |
|
603 | 603 | |
|
604 | 604 | def _is_revision_affected_fast(repo, fl, filerev, metadata_cache): |
|
605 | 605 | rl = fl._revlog |
|
606 | 606 | is_censored = lambda: rl.iscensored(filerev) |
|
607 | 607 | delta_base = lambda: rl.deltaparent(filerev) |
|
608 | 608 | delta = lambda: rl._chunk(filerev) |
|
609 | 609 | full_text = lambda: rl.rawdata(filerev) |
|
610 | 610 | parent_revs = lambda: rl.parentrevs(filerev) |
|
611 | 611 | return _is_revision_affected_fast_inner( |
|
612 | 612 | is_censored, |
|
613 | 613 | delta_base, |
|
614 | 614 | delta, |
|
615 | 615 | full_text, |
|
616 | 616 | parent_revs, |
|
617 | 617 | filerev, |
|
618 | 618 | metadata_cache, |
|
619 | 619 | ) |
|
620 | 620 | |
|
621 | 621 | |
|
622 | 622 | def _is_revision_affected_fast_inner( |
|
623 | 623 | is_censored, |
|
624 | 624 | delta_base, |
|
625 | 625 | delta, |
|
626 | 626 | full_text, |
|
627 | 627 | parent_revs, |
|
628 | 628 | filerev, |
|
629 | 629 | metadata_cache, |
|
630 | 630 | ): |
|
631 | 631 | """Optimization fast-path for `_is_revision_affected`. |
|
632 | 632 | |
|
633 | 633 | `metadata_cache` is a dict of `{rev: has_metadata}` which allows any |
|
634 | 634 | revision to check if its base has metadata, saving computation of the full |
|
635 | 635 | text, looking instead at the current delta. |
|
636 | 636 | |
|
637 | 637 | This optimization only works if the revisions are looked at in order.""" |
|
638 | 638 | |
|
639 | 639 | if is_censored(): |
|
640 | 640 | # Censored revisions don't contain metadata, so they cannot be affected |
|
641 | 641 | metadata_cache[filerev] = False |
|
642 | 642 | return False |
|
643 | 643 | |
|
644 | 644 | p1, p2 = parent_revs() |
|
645 | 645 | if p1 == nullrev or p2 != nullrev: |
|
646 | 646 | return False |
|
647 | 647 | |
|
648 | 648 | delta_parent = delta_base() |
|
649 | 649 | parent_has_metadata = metadata_cache.get(delta_parent) |
|
650 | 650 | if parent_has_metadata is None: |
|
651 | 651 | return _is_revision_affected_inner( |
|
652 | 652 | full_text, |
|
653 | 653 | parent_revs, |
|
654 | 654 | filerev, |
|
655 | 655 | metadata_cache, |
|
656 | 656 | ) |
|
657 | 657 | |
|
658 | 658 | chunk = delta() |
|
659 | 659 | if not len(chunk): |
|
660 | 660 | # No diff for this revision |
|
661 | 661 | return parent_has_metadata |
|
662 | 662 | |
|
663 | 663 | header_length = 12 |
|
664 | 664 | if len(chunk) < header_length: |
|
665 | 665 | raise error.Abort(_(b"patch cannot be decoded")) |
|
666 | 666 | |
|
667 | 667 | start, _end, _length = struct.unpack(b">lll", chunk[:header_length]) |
|
668 | 668 | |
|
669 | 669 | if start < 2: # len(b'\x01\n') == 2 |
|
670 | 670 | # This delta does *something* to the metadata marker (if any). |
|
671 | 671 | # Check it the slow way |
|
672 | 672 | is_affected = _is_revision_affected_inner( |
|
673 | 673 | full_text, |
|
674 | 674 | parent_revs, |
|
675 | 675 | filerev, |
|
676 | 676 | metadata_cache, |
|
677 | 677 | ) |
|
678 | 678 | return is_affected |
|
679 | 679 | |
|
680 | 680 | # The diff did not remove or add the metadata header, it's then in the same |
|
681 | 681 | # situation as its parent |
|
682 | 682 | metadata_cache[filerev] = parent_has_metadata |
|
683 | 683 | return parent_has_metadata |
|
684 | 684 | |
|
685 | 685 | |
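The `start < 2` test in _is_revision_affected_fast_inner() above reads the first hunk of a binary diff. Here is a small stand-alone sketch of that 12-byte header, with the hunk bytes built by hand (in the real code they come from revlog._chunk()):

```python
# Sketch only: a binary-diff hunk starts with ">lll" = (start, end, length of
# new data); start < 2 means the hunk touches the b'\x01\n' metadata marker.
import struct

new_bytes = b'\x01\n'                                   # made-up replacement data
chunk = struct.pack(b'>lll', 0, 2, len(new_bytes)) + new_bytes

start, end, length = struct.unpack(b'>lll', chunk[:12])
assert (start, end, length) == (0, 2, 2)
assert start < 2   # would force the slow full-text check in the code above
```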
|
686 | 686 | def _from_report(ui, repo, context, from_report, dry_run): |
|
687 | 687 | """ |
|
688 | 688 | Fix the revisions given in the `from_report` file, but still checks if the |
|
689 | 689 | revisions are indeed affected to prevent an unfortunate cyclic situation |
|
690 | 690 | where we'd swap well-ordered parents again. |
|
691 | 691 | |
|
692 | 692 | See the doc for `debug_fix_issue6528` for the format documentation. |
|
693 | 693 | """ |
|
694 | 694 | ui.write(_(b"loading report file '%s'\n") % from_report) |
|
695 | 695 | |
|
696 | 696 | with context(), open(from_report, mode='rb') as f: |
|
697 | 697 | for line in f.read().split(b'\n'): |
|
698 | 698 | if not line: |
|
699 | 699 | continue |
|
700 | 700 | filenodes, filename = line.split(b' ', 1) |
|
701 | 701 | fl = _filelog_from_filename(repo, filename) |
|
702 | 702 | to_fix = set( |
|
703 | 703 | fl.rev(binascii.unhexlify(n)) for n in filenodes.split(b',') |
|
704 | 704 | ) |
|
705 | 705 | excluded = set() |
|
706 | 706 | |
|
707 | 707 | for filerev in to_fix: |
|
708 | 708 | if _is_revision_affected(fl, filerev): |
|
709 | 709 | msg = b"found affected revision %d for filelog '%s'\n" |
|
710 | 710 | ui.warn(msg % (filerev, filename)) |
|
711 | 711 | else: |
|
712 | 712 | msg = _(b"revision %s of file '%s' is not affected\n") |
|
713 | 713 | msg %= (binascii.hexlify(fl.node(filerev)), filename) |
|
714 | 714 | ui.warn(msg) |
|
715 | 715 | excluded.add(filerev) |
|
716 | 716 | |
|
717 | 717 | to_fix = to_fix - excluded |
|
718 | 718 | if not to_fix: |
|
719 | 719 | msg = _(b"no affected revisions were found for '%s'\n") |
|
720 | 720 | ui.write(msg % filename) |
|
721 | 721 | continue |
|
722 | 722 | if not dry_run: |
|
723 | 723 | _reorder_filelog_parents(repo, fl, sorted(to_fix)) |
|
724 | 724 | |
|
725 | 725 | |
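For reference, a stand-alone sketch of the report line format parsed by _from_report() above and written later by repair_issue6528() when a to_report path is given: comma-joined hex filenodes, one space, then the filename. The node values and path below are made up.

```python
# Sketch only: build and re-parse one line of the issue6528 report file.
nodes = [b'00' * 20, b'ff' * 20]        # made-up 40-character hex filenodes
path = b'data/some/file.txt'            # made-up filename

line = b"%s %s\n" % (b",".join(nodes), path)

filenodes, filename = line.rstrip(b'\n').split(b' ', 1)
assert filename == path
assert filenodes.split(b',') == nodes
```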
|
726 | 726 | def filter_delta_issue6528(revlog, deltas_iter): |
|
727 | 727 | """filter incoming deltas to repair issue 6528 on the fly""" |
|
728 | 728 | metadata_cache = {} |
|
729 | 729 | |
|
730 | 730 | deltacomputer = deltas.deltacomputer(revlog) |
|
731 | 731 | |
|
732 | 732 | for rev, d in enumerate(deltas_iter, len(revlog)): |
|
733 | 733 | ( |
|
734 | 734 | node, |
|
735 | 735 | p1_node, |
|
736 | 736 | p2_node, |
|
737 | 737 | linknode, |
|
738 | 738 | deltabase, |
|
739 | 739 | delta, |
|
740 | 740 | flags, |
|
741 | 741 | sidedata, |
|
742 | 742 | ) = d |
|
743 | 743 | |
|
744 | 744 | if not revlog.index.has_node(deltabase): |
|
745 | 745 | raise error.LookupError( |
|
746 | 746 | deltabase, revlog.radix, _(b'unknown parent') |
|
747 | 747 | ) |
|
748 | 748 | base_rev = revlog.rev(deltabase) |
|
749 | 749 | if not revlog.index.has_node(p1_node): |
|
750 | 750 | raise error.LookupError(p1_node, revlog.radix, _(b'unknown parent')) |
|
751 | 751 | p1_rev = revlog.rev(p1_node) |
|
752 | 752 | if not revlog.index.has_node(p2_node): |
|
753 | 753 | raise error.LookupError(p2_node, revlog.radix, _(b'unknown parent')) |
|
754 | 754 | p2_rev = revlog.rev(p2_node) |
|
755 | 755 | |
|
756 | 756 | is_censored = lambda: bool(flags & REVIDX_ISCENSORED) |
|
757 | 757 | delta_base = lambda: revlog.rev(delta_base) |
|
758 | 758 | delta_base = lambda: base_rev |
|
759 | 759 | parent_revs = lambda: (p1_rev, p2_rev) |
|
760 | 760 | |
|
761 | 761 | def full_text(): |
|
762 | 762 | # note: being able to reuse the full text computation in the |
|
763 | 763 | # underlying addrevision would be useful however this is a bit too |
|
764 | 764 | # intrusive for the "quick" issue6528 fix we are writing before the |
|
765 | 765 | # 5.8 release |
|
766 | 766 | textlen = mdiff.patchedsize(revlog.size(base_rev), delta) |
|
767 | 767 | |
|
768 | 768 | revinfo = revlogutils.revisioninfo( |
|
769 | 769 | node, |
|
770 | 770 | p1_node, |
|
771 | 771 | p2_node, |
|
772 | 772 | [None], |
|
773 | 773 | textlen, |
|
774 | 774 | (base_rev, delta), |
|
775 | 775 | flags, |
|
776 | 776 | ) |
|
777 | 777 | # cached by the global "writing" context |
|
778 | 778 | assert revlog._writinghandles is not None |
|
779 | 779 | if revlog._inline: |
|
780 | 780 | fh = revlog._writinghandles[0] |
|
781 | 781 | else: |
|
782 | 782 | fh = revlog._writinghandles[1] |
|
783 | 783 | return deltacomputer.buildtext(revinfo, fh) |
|
784 | 784 | |
|
785 | 785 | is_affected = _is_revision_affected_fast_inner( |
|
786 | 786 | is_censored, |
|
787 | 787 | delta_base, |
|
788 | 788 | lambda: delta, |
|
789 | 789 | full_text, |
|
790 | 790 | parent_revs, |
|
791 | 791 | rev, |
|
792 | 792 | metadata_cache, |
|
793 | 793 | ) |
|
794 | 794 | if is_affected: |
|
795 | 795 | d = ( |
|
796 | 796 | node, |
|
797 | 797 | p2_node, |
|
798 | 798 | p1_node, |
|
799 | 799 | linknode, |
|
800 | 800 | deltabase, |
|
801 | 801 | delta, |
|
802 | 802 | flags, |
|
803 | 803 | sidedata, |
|
804 | 804 | ) |
|
805 | 805 | yield d |
|
806 | 806 | |
|
807 | 807 | |
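For context, a minimal sketch (not Mercurial's API; the function name is invented) of what the filter above does to each incoming delta: when a revision is detected as affected by issue 6528, the delta tuple is re-emitted with its two parent nodes swapped, and is passed through unchanged otherwise.

    def swap_parents_if_affected(delta_tuple, affected):
        # delta_tuple mirrors the 8-tuple unpacked above:
        # (node, p1, p2, linknode, deltabase, delta, flags, sidedata)
        node, p1, p2, linknode, deltabase, delta, flags, sidedata = delta_tuple
        if affected:
            return (node, p2, p1, linknode, deltabase, delta, flags, sidedata)
        return delta_tuple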
|
808 | 808 | def repair_issue6528( |
|
809 | 809 | ui, repo, dry_run=False, to_report=None, from_report=None, paranoid=False |
|
810 | 810 | ): |
|
811 | 811 | from .. import store # avoid cycle |
|
812 | 812 | |
|
813 | 813 | @contextlib.contextmanager |
|
814 | 814 | def context(): |
|
815 | 815 | if dry_run or to_report: # No need for locking |
|
816 | 816 | yield |
|
817 | 817 | else: |
|
818 | 818 | with repo.wlock(), repo.lock(): |
|
819 | 819 | yield |
|
820 | 820 | |
|
821 | 821 | if from_report: |
|
822 | 822 | return _from_report(ui, repo, context, from_report, dry_run) |
|
823 | 823 | |
|
824 | 824 | report_entries = [] |
|
825 | 825 | |
|
826 | 826 | with context(): |
|
827 | 827 | files = list( |
|
828 | 828 | entry |
|
829 | 829 | for entry in repo.store.datafiles() |
|
830 | 830 | if ( |
|
831 | entry.is_revlog | |
|
832 | and entry.is_revlog_main | |
|
833 | and entry.revlog_type == store.FILEFLAGS_FILELOG | |
|
831 | entry.is_revlog and entry.revlog_type == store.FILEFLAGS_FILELOG | |
|
834 | 832 | ) |
|
835 | 833 | ) |
|
836 | 834 | |
|
837 | 835 | progress = ui.makeprogress( |
|
838 | 836 | _(b"looking for affected revisions"), |
|
839 | 837 | unit=_(b"filelogs"), |
|
840 | 838 | total=len(files), |
|
841 | 839 | ) |
|
842 | 840 | found_nothing = True |
|
843 | 841 | |
|
844 | 842 | for entry in files: |
|
845 | 843 | progress.increment() |
|
846 | 844 | filename = entry.target_id |
|
847 | 845 | fl = _filelog_from_filename(repo, entry.target_id) |
|
848 | 846 | |
|
849 | 847 | # Set of filerevs (or hex filenodes if `to_report`) that need fixing |
|
850 | 848 | to_fix = set() |
|
851 | 849 | metadata_cache = {} |
|
852 | 850 | for filerev in fl.revs(): |
|
853 | 851 | affected = _is_revision_affected_fast( |
|
854 | 852 | repo, fl, filerev, metadata_cache |
|
855 | 853 | ) |
|
856 | 854 | if paranoid: |
|
857 | 855 | slow = _is_revision_affected(fl, filerev) |
|
858 | 856 | if slow != affected: |
|
859 | 857 | msg = _(b"paranoid check failed for '%s' at node %s") |
|
860 | 858 | node = binascii.hexlify(fl.node(filerev)) |
|
861 | 859 | raise error.Abort(msg % (filename, node)) |
|
862 | 860 | if affected: |
|
863 | 861 | msg = b"found affected revision %d for file '%s'\n" |
|
864 | 862 | ui.warn(msg % (filerev, filename)) |
|
865 | 863 | found_nothing = False |
|
866 | 864 | if not dry_run: |
|
867 | 865 | if to_report: |
|
868 | 866 | to_fix.add(binascii.hexlify(fl.node(filerev))) |
|
869 | 867 | else: |
|
870 | 868 | to_fix.add(filerev) |
|
871 | 869 | |
|
872 | 870 | if to_fix: |
|
873 | 871 | to_fix = sorted(to_fix) |
|
874 | 872 | if to_report: |
|
875 | 873 | report_entries.append((filename, to_fix)) |
|
876 | 874 | else: |
|
877 | 875 | _reorder_filelog_parents(repo, fl, to_fix) |
|
878 | 876 | |
|
879 | 877 | if found_nothing: |
|
880 | 878 | ui.write(_(b"no affected revisions were found\n")) |
|
881 | 879 | |
|
882 | 880 | if to_report and report_entries: |
|
883 | 881 | with open(to_report, mode="wb") as f: |
|
884 | 882 | for path, to_fix in report_entries: |
|
885 | 883 | f.write(b"%s %s\n" % (b",".join(to_fix), path)) |
|
886 | 884 | |
|
887 | 885 | progress.complete() |
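As a hedged illustration of the report format written above (one line per affected filelog: the comma-separated hex filenodes, a space, then the filelog path), a small helper such as the following could read an entry back; `parse_report_line` is a hypothetical name, not part of the change, but it matches the consumption shown at the top of this hunk.

    def parse_report_line(line):
        # b"<hexnode>,<hexnode>,... <path>\n" -> (path, [hexnodes])
        filenodes, filename = line.rstrip(b'\n').split(b' ', 1)
        return filename, filenodes.split(b',')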
@@ -1,1056 +1,1067 | |||
|
1 | 1 | # store.py - repository store handling for Mercurial |
|
2 | 2 | # |
|
3 | 3 | # Copyright 2008 Olivia Mackall <olivia@selenic.com> |
|
4 | 4 | # |
|
5 | 5 | # This software may be used and distributed according to the terms of the |
|
6 | 6 | # GNU General Public License version 2 or any later version. |
|
7 | 7 | |
|
8 | 8 | import collections |
|
9 | 9 | import functools |
|
10 | 10 | import os |
|
11 | 11 | import re |
|
12 | 12 | import stat |
|
13 | 13 | from typing import Generator |
|
14 | 14 | |
|
15 | 15 | from .i18n import _ |
|
16 | 16 | from .pycompat import getattr |
|
17 | 17 | from .thirdparty import attr |
|
18 | 18 | from .node import hex |
|
19 | 19 | from . import ( |
|
20 | 20 | changelog, |
|
21 | 21 | error, |
|
22 | 22 | manifest, |
|
23 | 23 | policy, |
|
24 | 24 | pycompat, |
|
25 | 25 | util, |
|
26 | 26 | vfs as vfsmod, |
|
27 | 27 | ) |
|
28 | 28 | from .utils import hashutil |
|
29 | 29 | |
|
30 | 30 | parsers = policy.importmod('parsers') |
|
31 | 31 | # how many bytes should be read from fncache in one read
|
32 | 32 | # It is done to prevent loading large fncache files into memory |
|
33 | 33 | fncache_chunksize = 10 ** 6 |
|
34 | 34 | |
|
35 | 35 | |
|
36 | 36 | def _match_tracked_entry(entry, matcher): |
|
37 | 37 | """parses a fncache entry and returns whether the entry is tracking a path |
|
38 | 38 | matched by matcher or not. |
|
39 | 39 | |
|
40 | 40 | If matcher is None, returns True""" |
|
41 | 41 | |
|
42 | 42 | if matcher is None: |
|
43 | 43 | return True |
|
44 | 44 | if entry.revlog_type == FILEFLAGS_FILELOG: |
|
45 | 45 | return matcher(entry.target_id) |
|
46 | 46 | elif entry.revlog_type == FILEFLAGS_MANIFESTLOG: |
|
47 | 47 | return matcher.visitdir(entry.target_id.rstrip(b'/')) |
|
48 | 48 | raise error.ProgrammingError(b"cannot process entry %r" % entry) |
|
49 | 49 | |
|
50 | 50 | |
|
51 | 51 | # This avoids a collision between a file named foo and a dir named |
|
52 | 52 | # foo.i or foo.d |
|
53 | 53 | def _encodedir(path): |
|
54 | 54 | """ |
|
55 | 55 | >>> _encodedir(b'data/foo.i') |
|
56 | 56 | 'data/foo.i' |
|
57 | 57 | >>> _encodedir(b'data/foo.i/bla.i') |
|
58 | 58 | 'data/foo.i.hg/bla.i' |
|
59 | 59 | >>> _encodedir(b'data/foo.i.hg/bla.i') |
|
60 | 60 | 'data/foo.i.hg.hg/bla.i' |
|
61 | 61 | >>> _encodedir(b'data/foo.i\\ndata/foo.i/bla.i\\ndata/foo.i.hg/bla.i\\n') |
|
62 | 62 | 'data/foo.i\\ndata/foo.i.hg/bla.i\\ndata/foo.i.hg.hg/bla.i\\n' |
|
63 | 63 | """ |
|
64 | 64 | return ( |
|
65 | 65 | path.replace(b".hg/", b".hg.hg/") |
|
66 | 66 | .replace(b".i/", b".i.hg/") |
|
67 | 67 | .replace(b".d/", b".d.hg/") |
|
68 | 68 | ) |
|
69 | 69 | |
|
70 | 70 | |
|
71 | 71 | encodedir = getattr(parsers, 'encodedir', _encodedir) |
|
72 | 72 | |
|
73 | 73 | |
|
74 | 74 | def decodedir(path): |
|
75 | 75 | """ |
|
76 | 76 | >>> decodedir(b'data/foo.i') |
|
77 | 77 | 'data/foo.i' |
|
78 | 78 | >>> decodedir(b'data/foo.i.hg/bla.i') |
|
79 | 79 | 'data/foo.i/bla.i' |
|
80 | 80 | >>> decodedir(b'data/foo.i.hg.hg/bla.i') |
|
81 | 81 | 'data/foo.i.hg/bla.i' |
|
82 | 82 | """ |
|
83 | 83 | if b".hg/" not in path: |
|
84 | 84 | return path |
|
85 | 85 | return ( |
|
86 | 86 | path.replace(b".d.hg/", b".d/") |
|
87 | 87 | .replace(b".i.hg/", b".i/") |
|
88 | 88 | .replace(b".hg.hg/", b".hg/") |
|
89 | 89 | ) |
|
90 | 90 | |
|
91 | 91 | |
|
92 | 92 | def _reserved(): |
|
93 | 93 | """characters that are problematic for filesystems |
|
94 | 94 | |
|
95 | 95 | * ascii escapes (0..31) |
|
96 | 96 | * ascii hi (126..255) |
|
97 | 97 | * windows specials |
|
98 | 98 | |
|
99 | 99 | these characters will be escaped by encodefunctions |
|
100 | 100 | """ |
|
101 | 101 | winreserved = [ord(x) for x in u'\\:*?"<>|'] |
|
102 | 102 | for x in range(32): |
|
103 | 103 | yield x |
|
104 | 104 | for x in range(126, 256): |
|
105 | 105 | yield x |
|
106 | 106 | for x in winreserved: |
|
107 | 107 | yield x |
|
108 | 108 | |
|
109 | 109 | |
|
110 | 110 | def _buildencodefun(): |
|
111 | 111 | """ |
|
112 | 112 | >>> enc, dec = _buildencodefun() |
|
113 | 113 | |
|
114 | 114 | >>> enc(b'nothing/special.txt') |
|
115 | 115 | 'nothing/special.txt' |
|
116 | 116 | >>> dec(b'nothing/special.txt') |
|
117 | 117 | 'nothing/special.txt' |
|
118 | 118 | |
|
119 | 119 | >>> enc(b'HELLO') |
|
120 | 120 | '_h_e_l_l_o' |
|
121 | 121 | >>> dec(b'_h_e_l_l_o') |
|
122 | 122 | 'HELLO' |
|
123 | 123 | |
|
124 | 124 | >>> enc(b'hello:world?') |
|
125 | 125 | 'hello~3aworld~3f' |
|
126 | 126 | >>> dec(b'hello~3aworld~3f') |
|
127 | 127 | 'hello:world?' |
|
128 | 128 | |
|
129 | 129 | >>> enc(b'the\\x07quick\\xADshot') |
|
130 | 130 | 'the~07quick~adshot' |
|
131 | 131 | >>> dec(b'the~07quick~adshot') |
|
132 | 132 | 'the\\x07quick\\xadshot' |
|
133 | 133 | """ |
|
134 | 134 | e = b'_' |
|
135 | 135 | xchr = pycompat.bytechr |
|
136 | 136 | asciistr = list(map(xchr, range(127))) |
|
137 | 137 | capitals = list(range(ord(b"A"), ord(b"Z") + 1)) |
|
138 | 138 | |
|
139 | 139 | cmap = {x: x for x in asciistr} |
|
140 | 140 | for x in _reserved(): |
|
141 | 141 | cmap[xchr(x)] = b"~%02x" % x |
|
142 | 142 | for x in capitals + [ord(e)]: |
|
143 | 143 | cmap[xchr(x)] = e + xchr(x).lower() |
|
144 | 144 | |
|
145 | 145 | dmap = {} |
|
146 | 146 | for k, v in cmap.items(): |
|
147 | 147 | dmap[v] = k |
|
148 | 148 | |
|
149 | 149 | def decode(s): |
|
150 | 150 | i = 0 |
|
151 | 151 | while i < len(s): |
|
152 | 152 | for l in range(1, 4): |
|
153 | 153 | try: |
|
154 | 154 | yield dmap[s[i : i + l]] |
|
155 | 155 | i += l |
|
156 | 156 | break |
|
157 | 157 | except KeyError: |
|
158 | 158 | pass |
|
159 | 159 | else: |
|
160 | 160 | raise KeyError |
|
161 | 161 | |
|
162 | 162 | return ( |
|
163 | 163 | lambda s: b''.join([cmap[s[c : c + 1]] for c in range(len(s))]), |
|
164 | 164 | lambda s: b''.join(list(decode(s))), |
|
165 | 165 | ) |
|
166 | 166 | |
|
167 | 167 | |
|
168 | 168 | _encodefname, _decodefname = _buildencodefun() |
|
169 | 169 | |
|
170 | 170 | |
|
171 | 171 | def encodefilename(s): |
|
172 | 172 | """ |
|
173 | 173 | >>> encodefilename(b'foo.i/bar.d/bla.hg/hi:world?/HELLO') |
|
174 | 174 | 'foo.i.hg/bar.d.hg/bla.hg.hg/hi~3aworld~3f/_h_e_l_l_o' |
|
175 | 175 | """ |
|
176 | 176 | return _encodefname(encodedir(s)) |
|
177 | 177 | |
|
178 | 178 | |
|
179 | 179 | def decodefilename(s): |
|
180 | 180 | """ |
|
181 | 181 | >>> decodefilename(b'foo.i.hg/bar.d.hg/bla.hg.hg/hi~3aworld~3f/_h_e_l_l_o') |
|
182 | 182 | 'foo.i/bar.d/bla.hg/hi:world?/HELLO' |
|
183 | 183 | """ |
|
184 | 184 | return decodedir(_decodefname(s)) |
|
185 | 185 | |
|
186 | 186 | |
|
187 | 187 | def _buildlowerencodefun(): |
|
188 | 188 | """ |
|
189 | 189 | >>> f = _buildlowerencodefun() |
|
190 | 190 | >>> f(b'nothing/special.txt') |
|
191 | 191 | 'nothing/special.txt' |
|
192 | 192 | >>> f(b'HELLO') |
|
193 | 193 | 'hello' |
|
194 | 194 | >>> f(b'hello:world?') |
|
195 | 195 | 'hello~3aworld~3f' |
|
196 | 196 | >>> f(b'the\\x07quick\\xADshot') |
|
197 | 197 | 'the~07quick~adshot' |
|
198 | 198 | """ |
|
199 | 199 | xchr = pycompat.bytechr |
|
200 | 200 | cmap = {xchr(x): xchr(x) for x in range(127)} |
|
201 | 201 | for x in _reserved(): |
|
202 | 202 | cmap[xchr(x)] = b"~%02x" % x |
|
203 | 203 | for x in range(ord(b"A"), ord(b"Z") + 1): |
|
204 | 204 | cmap[xchr(x)] = xchr(x).lower() |
|
205 | 205 | |
|
206 | 206 | def lowerencode(s): |
|
207 | 207 | return b"".join([cmap[c] for c in pycompat.iterbytestr(s)]) |
|
208 | 208 | |
|
209 | 209 | return lowerencode |
|
210 | 210 | |
|
211 | 211 | |
|
212 | 212 | lowerencode = getattr(parsers, 'lowerencode', None) or _buildlowerencodefun() |
|
213 | 213 | |
|
214 | 214 | # Windows reserved names: con, prn, aux, nul, com1..com9, lpt1..lpt9 |
|
215 | 215 | _winres3 = (b'aux', b'con', b'prn', b'nul') # length 3 |
|
216 | 216 | _winres4 = (b'com', b'lpt') # length 4 (with trailing 1..9) |
|
217 | 217 | |
|
218 | 218 | |
|
219 | 219 | def _auxencode(path, dotencode): |
|
220 | 220 | """ |
|
221 | 221 | Encodes filenames containing names reserved by Windows or which end in |
|
222 | 222 | period or space. Does not touch other single reserved characters c. |
|
223 | 223 | Specifically, c in '\\:*?"<>|' or ord(c) <= 31 are *not* encoded here. |
|
224 | 224 | Additionally encodes space or period at the beginning, if dotencode is |
|
225 | 225 | True. Parameter path is assumed to be all lowercase. |
|
226 | 226 | A segment only needs encoding if a reserved name appears as a |
|
227 | 227 | basename (e.g. "aux", "aux.foo"). A directory or file named "foo.aux" |
|
228 | 228 | doesn't need encoding. |
|
229 | 229 | |
|
230 | 230 | >>> s = b'.foo/aux.txt/txt.aux/con/prn/nul/foo.' |
|
231 | 231 | >>> _auxencode(s.split(b'/'), True) |
|
232 | 232 | ['~2efoo', 'au~78.txt', 'txt.aux', 'co~6e', 'pr~6e', 'nu~6c', 'foo~2e'] |
|
233 | 233 | >>> s = b'.com1com2/lpt9.lpt4.lpt1/conprn/com0/lpt0/foo.' |
|
234 | 234 | >>> _auxencode(s.split(b'/'), False) |
|
235 | 235 | ['.com1com2', 'lp~749.lpt4.lpt1', 'conprn', 'com0', 'lpt0', 'foo~2e'] |
|
236 | 236 | >>> _auxencode([b'foo. '], True) |
|
237 | 237 | ['foo.~20'] |
|
238 | 238 | >>> _auxencode([b' .foo'], True) |
|
239 | 239 | ['~20.foo'] |
|
240 | 240 | """ |
|
241 | 241 | for i, n in enumerate(path): |
|
242 | 242 | if not n: |
|
243 | 243 | continue |
|
244 | 244 | if dotencode and n[0] in b'. ': |
|
245 | 245 | n = b"~%02x" % ord(n[0:1]) + n[1:] |
|
246 | 246 | path[i] = n |
|
247 | 247 | else: |
|
248 | 248 | l = n.find(b'.') |
|
249 | 249 | if l == -1: |
|
250 | 250 | l = len(n) |
|
251 | 251 | if (l == 3 and n[:3] in _winres3) or ( |
|
252 | 252 | l == 4 |
|
253 | 253 | and n[3:4] <= b'9' |
|
254 | 254 | and n[3:4] >= b'1' |
|
255 | 255 | and n[:3] in _winres4 |
|
256 | 256 | ): |
|
257 | 257 | # encode third letter ('aux' -> 'au~78') |
|
258 | 258 | ec = b"~%02x" % ord(n[2:3]) |
|
259 | 259 | n = n[0:2] + ec + n[3:] |
|
260 | 260 | path[i] = n |
|
261 | 261 | if n[-1] in b'. ': |
|
262 | 262 | # encode last period or space ('foo...' -> 'foo..~2e') |
|
263 | 263 | path[i] = n[:-1] + b"~%02x" % ord(n[-1:]) |
|
264 | 264 | return path |
|
265 | 265 | |
|
266 | 266 | |
|
267 | 267 | _maxstorepathlen = 120 |
|
268 | 268 | _dirprefixlen = 8 |
|
269 | 269 | _maxshortdirslen = 8 * (_dirprefixlen + 1) - 4 |
|
270 | 270 | |
|
271 | 271 | |
|
272 | 272 | def _hashencode(path, dotencode): |
|
273 | 273 | digest = hex(hashutil.sha1(path).digest()) |
|
274 | 274 | le = lowerencode(path[5:]).split(b'/') # skips prefix 'data/' or 'meta/' |
|
275 | 275 | parts = _auxencode(le, dotencode) |
|
276 | 276 | basename = parts[-1] |
|
277 | 277 | _root, ext = os.path.splitext(basename) |
|
278 | 278 | sdirs = [] |
|
279 | 279 | sdirslen = 0 |
|
280 | 280 | for p in parts[:-1]: |
|
281 | 281 | d = p[:_dirprefixlen] |
|
282 | 282 | if d[-1] in b'. ': |
|
283 | 283 | # Windows can't access dirs ending in period or space |
|
284 | 284 | d = d[:-1] + b'_' |
|
285 | 285 | if sdirslen == 0: |
|
286 | 286 | t = len(d) |
|
287 | 287 | else: |
|
288 | 288 | t = sdirslen + 1 + len(d) |
|
289 | 289 | if t > _maxshortdirslen: |
|
290 | 290 | break |
|
291 | 291 | sdirs.append(d) |
|
292 | 292 | sdirslen = t |
|
293 | 293 | dirs = b'/'.join(sdirs) |
|
294 | 294 | if len(dirs) > 0: |
|
295 | 295 | dirs += b'/' |
|
296 | 296 | res = b'dh/' + dirs + digest + ext |
|
297 | 297 | spaceleft = _maxstorepathlen - len(res) |
|
298 | 298 | if spaceleft > 0: |
|
299 | 299 | filler = basename[:spaceleft] |
|
300 | 300 | res = b'dh/' + dirs + filler + digest + ext |
|
301 | 301 | return res |
|
302 | 302 | |
|
303 | 303 | |
|
304 | 304 | def _hybridencode(path, dotencode): |
|
305 | 305 | """encodes path with a length limit |
|
306 | 306 | |
|
307 | 307 | Encodes all paths that begin with 'data/', according to the following. |
|
308 | 308 | |
|
309 | 309 | Default encoding (reversible): |
|
310 | 310 | |
|
311 | 311 | Encodes all uppercase letters 'X' as '_x'. All reserved or illegal |
|
312 | 312 | characters are encoded as '~xx', where xx is the two digit hex code |
|
313 | 313 | of the character (see encodefilename). |
|
314 | 314 | Relevant path components consisting of Windows reserved filenames are |
|
315 | 315 | masked by encoding the third character ('aux' -> 'au~78', see _auxencode). |
|
316 | 316 | |
|
317 | 317 | Hashed encoding (not reversible): |
|
318 | 318 | |
|
319 | 319 | If the default-encoded path is longer than _maxstorepathlen, a |
|
320 | 320 | non-reversible hybrid hashing of the path is done instead. |
|
321 | 321 | This encoding uses up to _dirprefixlen characters of all directory |
|
322 | 322 | levels of the lowerencoded path, but not more levels than can fit into |
|
323 | 323 | _maxshortdirslen. |
|
324 | 324 | Then follows the filler followed by the sha digest of the full path. |
|
325 | 325 | The filler is the beginning of the basename of the lowerencoded path |
|
326 | 326 | (the basename is everything after the last path separator). The filler |
|
327 | 327 | is as long as possible, filling in characters from the basename until |
|
328 | 328 | the encoded path has _maxstorepathlen characters (or all chars of the |
|
329 | 329 | basename have been taken). |
|
330 | 330 | The extension (e.g. '.i' or '.d') is preserved. |
|
331 | 331 | |
|
332 | 332 | The string 'data/' at the beginning is replaced with 'dh/', if the hashed |
|
333 | 333 | encoding was used. |
|
334 | 334 | """ |
|
335 | 335 | path = encodedir(path) |
|
336 | 336 | ef = _encodefname(path).split(b'/') |
|
337 | 337 | res = b'/'.join(_auxencode(ef, dotencode)) |
|
338 | 338 | if len(res) > _maxstorepathlen: |
|
339 | 339 | res = _hashencode(path, dotencode) |
|
340 | 340 | return res |
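As an illustration only (not a doctest from the change, and assuming this file is importable as mercurial.store in a matching checkout): once the default encoding of a path would exceed _maxstorepathlen, the non-reversible hashed form is used, which starts with 'dh/' and stays within the length limit.

    from mercurial.store import _hybridencode, _maxstorepathlen

    long_path = b'data/' + b'x' * 200 + b'.i'  # hypothetical over-long path
    encoded = _hybridencode(long_path, True)
    assert encoded.startswith(b'dh/')
    assert len(encoded) <= _maxstorepathlen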
|
341 | 341 | |
|
342 | 342 | |
|
343 | 343 | def _pathencode(path): |
|
344 | 344 | de = encodedir(path) |
|
345 | 345 | if len(path) > _maxstorepathlen: |
|
346 | 346 | return _hashencode(de, True) |
|
347 | 347 | ef = _encodefname(de).split(b'/') |
|
348 | 348 | res = b'/'.join(_auxencode(ef, True)) |
|
349 | 349 | if len(res) > _maxstorepathlen: |
|
350 | 350 | return _hashencode(de, True) |
|
351 | 351 | return res |
|
352 | 352 | |
|
353 | 353 | |
|
354 | 354 | _pathencode = getattr(parsers, 'pathencode', _pathencode) |
|
355 | 355 | |
|
356 | 356 | |
|
357 | 357 | def _plainhybridencode(f): |
|
358 | 358 | return _hybridencode(f, False) |
|
359 | 359 | |
|
360 | 360 | |
|
361 | 361 | def _calcmode(vfs): |
|
362 | 362 | try: |
|
363 | 363 | # files in .hg/ will be created using this mode |
|
364 | 364 | mode = vfs.stat().st_mode |
|
365 | 365 | # avoid some useless chmods |
|
366 | 366 | if (0o777 & ~util.umask) == (0o777 & mode): |
|
367 | 367 | mode = None |
|
368 | 368 | except OSError: |
|
369 | 369 | mode = None |
|
370 | 370 | return mode |
|
371 | 371 | |
|
372 | 372 | |
|
373 | 373 | _data = [ |
|
374 | 374 | b'bookmarks', |
|
375 | 375 | b'narrowspec', |
|
376 | 376 | b'data', |
|
377 | 377 | b'meta', |
|
378 | 378 | b'00manifest.d', |
|
379 | 379 | b'00manifest.i', |
|
380 | 380 | b'00changelog.d', |
|
381 | 381 | b'00changelog.i', |
|
382 | 382 | b'phaseroots', |
|
383 | 383 | b'obsstore', |
|
384 | 384 | b'requires', |
|
385 | 385 | ] |
|
386 | 386 | |
|
387 | 387 | REVLOG_FILES_MAIN_EXT = (b'.i',) |
|
388 | 388 | REVLOG_FILES_OTHER_EXT = ( |
|
389 | 389 | b'.idx', |
|
390 | 390 | b'.d', |
|
391 | 391 | b'.dat', |
|
392 | 392 | b'.n', |
|
393 | 393 | b'.nd', |
|
394 | 394 | b'.sda', |
|
395 | 395 | ) |
|
396 | 396 | # file extensions that also use a `-SOMELONGIDHASH.ext` form
|
397 | 397 | REVLOG_FILES_LONG_EXT = ( |
|
398 | 398 | b'.nd', |
|
399 | 399 | b'.idx', |
|
400 | 400 | b'.dat', |
|
401 | 401 | b'.sda', |
|
402 | 402 | ) |
|
403 | 403 | # files that are "volatile" and might change between listing and streaming |
|
404 | 404 | # |
|
405 | 405 | # note: the ".nd" file are nodemap data and won't "change" but they might be |
|
406 | 406 | # deleted. |
|
407 | 407 | REVLOG_FILES_VOLATILE_EXT = (b'.n', b'.nd') |
|
408 | 408 | |
|
409 | 409 | # some exception to the above matching |
|
410 | 410 | # |
|
411 | 411 | # XXX This is currently not in use because of issue6542 |
|
412 | 412 | EXCLUDED = re.compile(br'.*undo\.[^/]+\.(nd?|i)$') |
|
413 | 413 | |
|
414 | 414 | |
|
415 | 415 | def is_revlog(f, kind, st): |
|
416 | 416 | if kind != stat.S_IFREG: |
|
417 | 417 | return None |
|
418 | 418 | return revlog_type(f) |
|
419 | 419 | |
|
420 | 420 | |
|
421 | 421 | def revlog_type(f): |
|
422 | 422 | # XXX we need to filter `undo.` created by the transaction here, however |
|
423 | 423 | # being naive about it also filter revlog for `undo.*` files, leading to |
|
424 | 424 | # issue6542. So we no longer use EXCLUDED. |
|
425 | 425 | if f.endswith(REVLOG_FILES_MAIN_EXT): |
|
426 | 426 | return FILEFLAGS_REVLOG_MAIN |
|
427 | 427 | elif f.endswith(REVLOG_FILES_OTHER_EXT): |
|
428 | 428 | t = FILETYPE_FILELOG_OTHER |
|
429 | 429 | if f.endswith(REVLOG_FILES_VOLATILE_EXT): |
|
430 | 430 | t |= FILEFLAGS_VOLATILE |
|
431 | 431 | return t |
|
432 | 432 | return None |
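A few hedged examples of the classification (relying on the flag constants defined just below, and assuming the module is importable as mercurial.store):

    from mercurial import store

    assert store.revlog_type(b'data/foo.i') == store.FILEFLAGS_REVLOG_MAIN
    assert store.revlog_type(b'data/foo.d') == store.FILETYPE_FILELOG_OTHER
    # nodemap files are additionally flagged as volatile
    assert store.revlog_type(b'00changelog.n') & store.FILEFLAGS_VOLATILE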
|
433 | 433 | |
|
434 | 434 | |
|
435 | 435 | # the file is part of changelog data |
|
436 | 436 | FILEFLAGS_CHANGELOG = 1 << 13 |
|
437 | 437 | # the file is part of manifest data |
|
438 | 438 | FILEFLAGS_MANIFESTLOG = 1 << 12 |
|
439 | 439 | # the file is part of filelog data |
|
440 | 440 | FILEFLAGS_FILELOG = 1 << 11 |
|
441 | 441 | # files that are not directly part of a revlog
|
442 | 442 | FILEFLAGS_OTHER = 1 << 10 |
|
443 | 443 | |
|
444 | 444 | # the main entry point for a revlog |
|
445 | 445 | FILEFLAGS_REVLOG_MAIN = 1 << 1 |
|
446 | 446 | # a secondary file for a revlog |
|
447 | 447 | FILEFLAGS_REVLOG_OTHER = 1 << 0 |
|
448 | 448 | |
|
449 | 449 | # files that are "volatile" and might change between listing and streaming |
|
450 | 450 | FILEFLAGS_VOLATILE = 1 << 20 |
|
451 | 451 | |
|
452 | 452 | FILETYPE_CHANGELOG_MAIN = FILEFLAGS_CHANGELOG | FILEFLAGS_REVLOG_MAIN |
|
453 | 453 | FILETYPE_CHANGELOG_OTHER = FILEFLAGS_CHANGELOG | FILEFLAGS_REVLOG_OTHER |
|
454 | 454 | FILETYPE_MANIFESTLOG_MAIN = FILEFLAGS_MANIFESTLOG | FILEFLAGS_REVLOG_MAIN |
|
455 | 455 | FILETYPE_MANIFESTLOG_OTHER = FILEFLAGS_MANIFESTLOG | FILEFLAGS_REVLOG_OTHER |
|
456 | 456 | FILETYPE_FILELOG_MAIN = FILEFLAGS_FILELOG | FILEFLAGS_REVLOG_MAIN |
|
457 | 457 | FILETYPE_FILELOG_OTHER = FILEFLAGS_FILELOG | FILEFLAGS_REVLOG_OTHER |
|
458 | 458 | FILETYPE_OTHER = FILEFLAGS_OTHER |
|
459 | 459 | |
|
460 | 460 | |
|
461 | 461 | @attr.s(slots=True, init=False) |
|
462 | 462 | class BaseStoreEntry: |
|
463 | 463 | """An entry in the store |
|
464 | 464 | |
|
465 | 465 | This is returned by `store.walk` and represent some data in the store.""" |
|
466 | 466 | |
|
467 | ||
|
468 | @attr.s(slots=True, init=False) | |
|
469 | class SimpleStoreEntry(BaseStoreEntry): | |
|
470 | """A generic entry in the store""" | |
|
471 | ||
|
472 | is_revlog = False | |
|
473 | ||
|
467 | 474 | _entry_path = attr.ib() |
|
468 | 475 | _is_volatile = attr.ib(default=False) |
|
469 | 476 | _file_size = attr.ib(default=None) |
|
470 | 477 | |
|
471 | 478 | def __init__( |
|
472 | 479 | self, |
|
473 | 480 | entry_path, |
|
474 | 481 | is_volatile=False, |
|
475 | 482 | file_size=None, |
|
476 | 483 | ): |
|
484 | super().__init__() | |
|
477 | 485 | self._entry_path = entry_path |
|
478 | 486 | self._is_volatile = is_volatile |
|
479 | 487 | self._file_size = file_size |
|
480 | 488 | |
|
481 | 489 | def files(self): |
|
482 | 490 | return [ |
|
483 | 491 | StoreFile( |
|
484 | 492 | unencoded_path=self._entry_path, |
|
485 | 493 | file_size=self._file_size, |
|
486 | 494 | is_volatile=self._is_volatile, |
|
487 | 495 | ) |
|
488 | 496 | ] |
|
489 | 497 | |
|
490 | 498 | |
|
491 | 499 | @attr.s(slots=True, init=False) |
|
492 | class SimpleStoreEntry(BaseStoreEntry): | |
|
493 | """A generic entry in the store""" | |
|
494 | ||
|
495 | is_revlog = False | |
|
496 | ||
|
497 | ||
|
498 | @attr.s(slots=True, init=False) | |
|
499 | 500 | class RevlogStoreEntry(BaseStoreEntry): |
|
500 | 501 | """A revlog entry in the store""" |
|
501 | 502 | |
|
502 | 503 | is_revlog = True |
|
504 | ||
|
503 | 505 | revlog_type = attr.ib(default=None) |
|
504 | 506 | target_id = attr.ib(default=None) |
|
505 |
|
|
|
507 | _path_prefix = attr.ib(default=None) | |
|
508 | _details = attr.ib(default=None) | |
|
506 | 509 | |
|
507 | 510 | def __init__( |
|
508 | 511 | self, |
|
509 | entry_path, | |
|
510 | 512 | revlog_type, |
|
513 | path_prefix, | |
|
511 | 514 | target_id, |
|
512 |
|
|
|
513 | is_volatile=False, | |
|
514 | file_size=None, | |
|
515 | details, | |
|
515 | 516 | ): |
|
516 | super().__init__( | |
|
517 | entry_path=entry_path, | |
|
518 | is_volatile=is_volatile, | |
|
519 | file_size=file_size, | |
|
520 | ) | |
|
517 | super().__init__() | |
|
521 | 518 | self.revlog_type = revlog_type |
|
522 | 519 | self.target_id = target_id |
|
523 | self.is_revlog_main = is_revlog_main | |
|
520 | self._path_prefix = path_prefix | |
|
521 | assert b'.i' in details, (path_prefix, details) | |
|
522 | self._details = details | |
|
524 | 523 | |
|
525 | 524 | def main_file_path(self): |
|
526 | 525 | """unencoded path of the main revlog file""" |
|
527 |
return self. |
|
|
526 | return self._path_prefix + b'.i' | |
|
527 | ||
|
528 | def files(self): | |
|
529 | files = [] | |
|
530 | for ext in sorted(self._details, key=_ext_key): | |
|
531 | path = self._path_prefix + ext | |
|
532 | data = self._details[ext] | |
|
533 | files.append(StoreFile(unencoded_path=path, **data)) | |
|
534 | return files | |
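A hypothetical construction in this module's namespace, mirroring how datafiles() below builds entries after this change (values invented for illustration):

    entry = RevlogStoreEntry(
        revlog_type=FILEFLAGS_FILELOG,
        path_prefix=b'data/foo',
        target_id=b'foo',
        details={b'.i': {'is_volatile': False, 'file_size': 64}},
    )
    assert [f.unencoded_path for f in entry.files()] == [b'data/foo.i']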
|
528 | 535 | |
|
529 | 536 | |
|
530 | 537 | @attr.s(slots=True) |
|
531 | 538 | class StoreFile: |
|
532 | 539 | """a file matching an entry""" |
|
533 | 540 | |
|
534 | 541 | unencoded_path = attr.ib() |
|
535 |
_file_size = attr.ib(default= |
|
|
542 | _file_size = attr.ib(default=None) | |
|
536 | 543 | is_volatile = attr.ib(default=False) |
|
537 | 544 | |
|
538 | 545 | def file_size(self, vfs): |
|
539 | 546 | if self._file_size is not None: |
|
540 | 547 | return self._file_size |
|
541 | 548 | try: |
|
542 | 549 | return vfs.stat(self.unencoded_path).st_size |
|
543 | 550 | except FileNotFoundError: |
|
544 | 551 | return 0 |
|
545 | 552 | |
|
546 | 553 | |
|
547 | 554 | def _gather_revlog(files_data): |
|
548 | 555 | """group files per revlog prefix |
|
549 | 556 | |
|
550 | 557 | This returns a two-level nested dict. The top-level key is the revlog prefix
|
551 | 558 | without extension; the second level maps each file "suffix" (extension)
|
552 | 559 | seen for this revlog to an arbitrary file data value.
|
553 | 560 | """ |
|
554 | 561 | revlogs = collections.defaultdict(dict) |
|
555 | 562 | for u, value in files_data: |
|
556 | 563 | name, ext = _split_revlog_ext(u) |
|
557 | 564 | revlogs[name][ext] = value |
|
558 | 565 | return sorted(revlogs.items()) |
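A rough usage sketch (hypothetical input values, assuming this file is importable as mercurial.store and matches the code above):

    from mercurial.store import _gather_revlog

    assert _gather_revlog(
        [(b'data/foo.i', 1), (b'data/foo.d', 2), (b'data/bar.i', 3)]
    ) == [
        (b'data/bar', {b'.i': 3}),
        (b'data/foo', {b'.d': 2, b'.i': 1}),
    ]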
|
559 | 566 | |
|
560 | 567 | |
|
561 | 568 | def _split_revlog_ext(filename): |
|
562 | 569 | """split the revlog file prefix from the variable extension""" |
|
563 | 570 | if filename.endswith(REVLOG_FILES_LONG_EXT): |
|
564 | 571 | char = b'-' |
|
565 | 572 | else: |
|
566 | 573 | char = b'.' |
|
567 | 574 | idx = filename.rfind(char) |
|
568 | 575 | return filename[:idx], filename[idx:] |
|
569 | 576 | |
|
570 | 577 | |
|
571 | 578 | def _ext_key(ext): |
|
572 | 579 | """a key to order revlog suffix |
|
573 | 580 | |
|
574 | 581 | important to issue .i after the other entries."""
|
575 | 582 | # the only important part of this order is to keep the `.i` last. |
|
576 | 583 | if ext.endswith(b'.n'): |
|
577 | 584 | return (0, ext) |
|
578 | 585 | elif ext.endswith(b'.nd'): |
|
579 | 586 | return (10, ext) |
|
580 | 587 | elif ext.endswith(b'.d'): |
|
581 | 588 | return (20, ext) |
|
582 | 589 | elif ext.endswith(b'.i'): |
|
583 | 590 | return (50, ext) |
|
584 | 591 | else: |
|
585 | 592 | return (40, ext) |
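For illustration (assuming the module is importable as mercurial.store), sorting a typical set of revlog extensions with this key keeps the index file last:

    from mercurial.store import _ext_key

    assert sorted([b'.i', b'.d', b'.n', b'.nd', b'.dat'], key=_ext_key) == [
        b'.n', b'.nd', b'.d', b'.dat', b'.i'
    ]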
|
586 | 593 | |
|
587 | 594 | |
|
588 | 595 | class basicstore: |
|
589 | 596 | '''base class for local repository stores''' |
|
590 | 597 | |
|
591 | 598 | def __init__(self, path, vfstype): |
|
592 | 599 | vfs = vfstype(path) |
|
593 | 600 | self.path = vfs.base |
|
594 | 601 | self.createmode = _calcmode(vfs) |
|
595 | 602 | vfs.createmode = self.createmode |
|
596 | 603 | self.rawvfs = vfs |
|
597 | 604 | self.vfs = vfsmod.filtervfs(vfs, encodedir) |
|
598 | 605 | self.opener = self.vfs |
|
599 | 606 | |
|
600 | 607 | def join(self, f): |
|
601 | 608 | return self.path + b'/' + encodedir(f) |
|
602 | 609 | |
|
603 | 610 | def _walk(self, relpath, recurse, undecodable=None): |
|
604 | 611 | '''yields (revlog_type, unencoded, size)''' |
|
605 | 612 | path = self.path |
|
606 | 613 | if relpath: |
|
607 | 614 | path += b'/' + relpath |
|
608 | 615 | striplen = len(self.path) + 1 |
|
609 | 616 | l = [] |
|
610 | 617 | if self.rawvfs.isdir(path): |
|
611 | 618 | visit = [path] |
|
612 | 619 | readdir = self.rawvfs.readdir |
|
613 | 620 | while visit: |
|
614 | 621 | p = visit.pop() |
|
615 | 622 | for f, kind, st in readdir(p, stat=True): |
|
616 | 623 | fp = p + b'/' + f |
|
617 | 624 | rl_type = is_revlog(f, kind, st) |
|
618 | 625 | if rl_type is not None: |
|
619 | 626 | n = util.pconvert(fp[striplen:]) |
|
620 | 627 | l.append((decodedir(n), (rl_type, st.st_size))) |
|
621 | 628 | elif kind == stat.S_IFDIR and recurse: |
|
622 | 629 | visit.append(fp) |
|
623 | 630 | |
|
624 | 631 | l.sort() |
|
625 | 632 | return l |
|
626 | 633 | |
|
627 | 634 | def changelog(self, trypending, concurrencychecker=None): |
|
628 | 635 | return changelog.changelog( |
|
629 | 636 | self.vfs, |
|
630 | 637 | trypending=trypending, |
|
631 | 638 | concurrencychecker=concurrencychecker, |
|
632 | 639 | ) |
|
633 | 640 | |
|
634 | 641 | def manifestlog(self, repo, storenarrowmatch): |
|
635 | 642 | rootstore = manifest.manifestrevlog(repo.nodeconstants, self.vfs) |
|
636 | 643 | return manifest.manifestlog(self.vfs, repo, rootstore, storenarrowmatch) |
|
637 | 644 | |
|
638 | 645 | def datafiles( |
|
639 | 646 | self, matcher=None, undecodable=None |
|
640 | 647 | ) -> Generator[BaseStoreEntry, None, None]: |
|
641 | 648 | """Like walk, but excluding the changelog and root manifest. |
|
642 | 649 | |
|
643 | 650 | When [undecodable] is None, revlog names that can't be
|
644 | 651 | decoded cause an exception. When it is provided, it should |
|
645 | 652 | be a list and the filenames that can't be decoded are added |
|
646 | 653 | to it instead. This is very rarely needed.""" |
|
647 | 654 | dirs = [ |
|
648 | 655 | (b'data', FILEFLAGS_FILELOG), |
|
649 | 656 | (b'meta', FILEFLAGS_MANIFESTLOG), |
|
650 | 657 | ] |
|
651 | 658 | for base_dir, rl_type in dirs: |
|
652 | 659 | files = self._walk(base_dir, True, undecodable=undecodable) |
|
653 | 660 | files = (f for f in files if f[1][0] is not None) |
|
654 | 661 | for revlog, details in _gather_revlog(files): |
|
655 | for ext, (t, s) in sorted(details.items()): | |
|
656 | u = revlog + ext | |
|
662 | file_details = {} | |
|
657 | 663 |
|
|
664 | for ext, (t, s) in sorted(details.items()): | |
|
665 | file_details[ext] = { | |
|
666 | 'is_volatile': bool(t & FILEFLAGS_VOLATILE), | |
|
667 | 'file_size': s, | |
|
668 | } | |
|
658 | 669 |
|
|
659 |
|
|
|
670 | path_prefix=revlog, | |
|
660 | 671 |
|
|
661 | 672 |
|
|
662 | is_revlog_main=bool(t & FILEFLAGS_REVLOG_MAIN), | |
|
663 | is_volatile=bool(t & FILEFLAGS_VOLATILE), | |
|
664 | file_size=s, | |
|
673 | details=file_details, | |
|
665 | 674 |
|
|
666 | 675 | |
|
667 | 676 | def topfiles(self) -> Generator[BaseStoreEntry, None, None]: |
|
668 | 677 | files = reversed(self._walk(b'', False)) |
|
669 | 678 | |
|
670 | 679 | changelogs = collections.defaultdict(dict) |
|
671 | 680 | manifestlogs = collections.defaultdict(dict) |
|
672 | 681 | |
|
673 | 682 | for u, (t, s) in files: |
|
674 | 683 | if u.startswith(b'00changelog'): |
|
675 | 684 | name, ext = _split_revlog_ext(u) |
|
676 | 685 | changelogs[name][ext] = (t, s) |
|
677 | 686 | elif u.startswith(b'00manifest'): |
|
678 | 687 | name, ext = _split_revlog_ext(u) |
|
679 | 688 | manifestlogs[name][ext] = (t, s) |
|
680 | 689 | else: |
|
681 | 690 | yield SimpleStoreEntry( |
|
682 | 691 | entry_path=u, |
|
683 | 692 | is_volatile=bool(t & FILEFLAGS_VOLATILE), |
|
684 | 693 | file_size=s, |
|
685 | 694 | ) |
|
686 | 695 | # yield manifest before changelog |
|
687 | 696 | top_rl = [ |
|
688 | 697 | (manifestlogs, FILEFLAGS_MANIFESTLOG), |
|
689 | 698 | (changelogs, FILEFLAGS_CHANGELOG), |
|
690 | 699 | ] |
|
691 | 700 | assert len(manifestlogs) <= 1 |
|
692 | 701 | assert len(changelogs) <= 1 |
|
693 | 702 | for data, revlog_type in top_rl: |
|
694 | 703 | for revlog, details in sorted(data.items()): |
|
695 | # (keeping ordering so we get 00changelog.i last) | |
|
696 | key = lambda x: _ext_key(x[0]) | |
|
697 | for ext, (t, s) in sorted(details.items(), key=key): | |
|
698 | u = revlog + ext | |
|
704 | file_details = {} | |
|
705 | for ext, (t, s) in details.items(): | |
|
706 | file_details[ext] = { | |
|
707 | 'is_volatile': bool(t & FILEFLAGS_VOLATILE), | |
|
708 | 'file_size': s, | |
|
709 | } | |
|
699 | 710 |
|
|
700 |
|
|
|
711 | path_prefix=revlog, | |
|
701 | 712 |
|
|
702 | 713 |
|
|
703 | is_revlog_main=bool(t & FILEFLAGS_REVLOG_MAIN), | |
|
704 | is_volatile=bool(t & FILEFLAGS_VOLATILE), | |
|
705 | file_size=s, | |
|
714 | details=file_details, | |
|
706 | 715 |
|
|
707 | 716 | |
|
708 | 717 | def walk(self, matcher=None) -> Generator[BaseStoreEntry, None, None]: |
|
709 | 718 | """return files related to data storage (ie: revlogs) |
|
710 | 719 | |
|
711 | 720 | yields (file_type, unencoded, size) |
|
712 | 721 | |
|
713 | 722 | if a matcher is passed, only storage files of tracked paths
|
714 | 723 | that match the matcher are yielded
|
715 | 724 | """ |
|
716 | 725 | # yield data files first |
|
717 | 726 | for x in self.datafiles(matcher): |
|
718 | 727 | yield x |
|
719 | 728 | for x in self.topfiles(): |
|
720 | 729 | yield x |
|
721 | 730 | |
|
722 | 731 | def copylist(self): |
|
723 | 732 | return _data |
|
724 | 733 | |
|
725 | 734 | def write(self, tr): |
|
726 | 735 | pass |
|
727 | 736 | |
|
728 | 737 | def invalidatecaches(self): |
|
729 | 738 | pass |
|
730 | 739 | |
|
731 | 740 | def markremoved(self, fn): |
|
732 | 741 | pass |
|
733 | 742 | |
|
734 | 743 | def __contains__(self, path): |
|
735 | 744 | '''Checks if the store contains path''' |
|
736 | 745 | path = b"/".join((b"data", path)) |
|
737 | 746 | # file? |
|
738 | 747 | if self.vfs.exists(path + b".i"): |
|
739 | 748 | return True |
|
740 | 749 | # dir? |
|
741 | 750 | if not path.endswith(b"/"): |
|
742 | 751 | path = path + b"/" |
|
743 | 752 | return self.vfs.exists(path) |
|
744 | 753 | |
|
745 | 754 | |
|
746 | 755 | class encodedstore(basicstore): |
|
747 | 756 | def __init__(self, path, vfstype): |
|
748 | 757 | vfs = vfstype(path + b'/store') |
|
749 | 758 | self.path = vfs.base |
|
750 | 759 | self.createmode = _calcmode(vfs) |
|
751 | 760 | vfs.createmode = self.createmode |
|
752 | 761 | self.rawvfs = vfs |
|
753 | 762 | self.vfs = vfsmod.filtervfs(vfs, encodefilename) |
|
754 | 763 | self.opener = self.vfs |
|
755 | 764 | |
|
756 | 765 | def _walk(self, relpath, recurse, undecodable=None): |
|
757 | 766 | old = super()._walk(relpath, recurse) |
|
758 | 767 | new = [] |
|
759 | 768 | for f1, value in old: |
|
760 | 769 | try: |
|
761 | 770 | f2 = decodefilename(f1) |
|
762 | 771 | except KeyError: |
|
763 | 772 | if undecodable is None: |
|
764 | 773 | msg = _(b'undecodable revlog name %s') % f1 |
|
765 | 774 | raise error.StorageError(msg) |
|
766 | 775 | else: |
|
767 | 776 | undecodable.append(f1) |
|
768 | 777 | continue |
|
769 | 778 | new.append((f2, value)) |
|
770 | 779 | return new |
|
771 | 780 | |
|
772 | 781 | def datafiles( |
|
773 | 782 | self, matcher=None, undecodable=None |
|
774 | 783 | ) -> Generator[BaseStoreEntry, None, None]: |
|
775 | 784 | entries = super(encodedstore, self).datafiles(undecodable=undecodable) |
|
776 | 785 | for entry in entries: |
|
777 | 786 | if _match_tracked_entry(entry, matcher): |
|
778 | 787 | yield entry |
|
779 | 788 | |
|
780 | 789 | def join(self, f): |
|
781 | 790 | return self.path + b'/' + encodefilename(f) |
|
782 | 791 | |
|
783 | 792 | def copylist(self): |
|
784 | 793 | return [b'requires', b'00changelog.i'] + [b'store/' + f for f in _data] |
|
785 | 794 | |
|
786 | 795 | |
|
787 | 796 | class fncache: |
|
788 | 797 | # the filename used to be partially encoded |
|
789 | 798 | # hence the encodedir/decodedir dance |
|
790 | 799 | def __init__(self, vfs): |
|
791 | 800 | self.vfs = vfs |
|
792 | 801 | self._ignores = set() |
|
793 | 802 | self.entries = None |
|
794 | 803 | self._dirty = False |
|
795 | 804 | # set of new additions to fncache |
|
796 | 805 | self.addls = set() |
|
797 | 806 | |
|
798 | 807 | def ensureloaded(self, warn=None): |
|
799 | 808 | """read the fncache file if not already read. |
|
800 | 809 | |
|
801 | 810 | If the file on disk is corrupted, raise. If warn is provided, |
|
802 | 811 | warn and keep going instead.""" |
|
803 | 812 | if self.entries is None: |
|
804 | 813 | self._load(warn) |
|
805 | 814 | |
|
806 | 815 | def _load(self, warn=None): |
|
807 | 816 | '''fill the entries from the fncache file''' |
|
808 | 817 | self._dirty = False |
|
809 | 818 | try: |
|
810 | 819 | fp = self.vfs(b'fncache', mode=b'rb') |
|
811 | 820 | except IOError: |
|
812 | 821 | # skip nonexistent file |
|
813 | 822 | self.entries = set() |
|
814 | 823 | return |
|
815 | 824 | |
|
816 | 825 | self.entries = set() |
|
817 | 826 | chunk = b'' |
|
818 | 827 | for c in iter(functools.partial(fp.read, fncache_chunksize), b''): |
|
819 | 828 | chunk += c |
|
820 | 829 | try: |
|
821 | 830 | p = chunk.rindex(b'\n') |
|
822 | 831 | self.entries.update(decodedir(chunk[: p + 1]).splitlines()) |
|
823 | 832 | chunk = chunk[p + 1 :] |
|
824 | 833 | except ValueError: |
|
825 | 834 | # substring '\n' not found, maybe the entry is bigger than the |
|
826 | 835 | # chunksize, so let's keep iterating |
|
827 | 836 | pass |
|
828 | 837 | |
|
829 | 838 | if chunk: |
|
830 | 839 | msg = _(b"fncache does not ends with a newline") |
|
831 | 840 | if warn: |
|
832 | 841 | warn(msg + b'\n') |
|
833 | 842 | else: |
|
834 | 843 | raise error.Abort( |
|
835 | 844 | msg, |
|
836 | 845 | hint=_( |
|
837 | 846 | b"use 'hg debugrebuildfncache' to " |
|
838 | 847 | b"rebuild the fncache" |
|
839 | 848 | ), |
|
840 | 849 | ) |
|
841 | 850 | self._checkentries(fp, warn) |
|
842 | 851 | fp.close() |
|
843 | 852 | |
|
844 | 853 | def _checkentries(self, fp, warn): |
|
845 | 854 | """make sure there is no empty string in entries""" |
|
846 | 855 | if b'' in self.entries: |
|
847 | 856 | fp.seek(0) |
|
848 | 857 | for n, line in enumerate(fp): |
|
849 | 858 | if not line.rstrip(b'\n'): |
|
850 | 859 | t = _(b'invalid entry in fncache, line %d') % (n + 1) |
|
851 | 860 | if warn: |
|
852 | 861 | warn(t + b'\n') |
|
853 | 862 | else: |
|
854 | 863 | raise error.Abort(t) |
|
855 | 864 | |
|
856 | 865 | def write(self, tr): |
|
857 | 866 | if self._dirty: |
|
858 | 867 | assert self.entries is not None |
|
859 | 868 | self.entries = self.entries | self.addls |
|
860 | 869 | self.addls = set() |
|
861 | 870 | tr.addbackup(b'fncache') |
|
862 | 871 | fp = self.vfs(b'fncache', mode=b'wb', atomictemp=True) |
|
863 | 872 | if self.entries: |
|
864 | 873 | fp.write(encodedir(b'\n'.join(self.entries) + b'\n')) |
|
865 | 874 | fp.close() |
|
866 | 875 | self._dirty = False |
|
867 | 876 | if self.addls: |
|
868 | 877 | # if we have just new entries, let's append them to the fncache |
|
869 | 878 | tr.addbackup(b'fncache') |
|
870 | 879 | fp = self.vfs(b'fncache', mode=b'ab', atomictemp=True) |
|
871 | 880 | if self.addls: |
|
872 | 881 | fp.write(encodedir(b'\n'.join(self.addls) + b'\n')) |
|
873 | 882 | fp.close() |
|
874 | 883 | self.entries = None |
|
875 | 884 | self.addls = set() |
|
876 | 885 | |
|
877 | 886 | def addignore(self, fn): |
|
878 | 887 | self._ignores.add(fn) |
|
879 | 888 | |
|
880 | 889 | def add(self, fn): |
|
881 | 890 | if fn in self._ignores: |
|
882 | 891 | return |
|
883 | 892 | if self.entries is None: |
|
884 | 893 | self._load() |
|
885 | 894 | if fn not in self.entries: |
|
886 | 895 | self.addls.add(fn) |
|
887 | 896 | |
|
888 | 897 | def remove(self, fn): |
|
889 | 898 | if self.entries is None: |
|
890 | 899 | self._load() |
|
891 | 900 | if fn in self.addls: |
|
892 | 901 | self.addls.remove(fn) |
|
893 | 902 | return |
|
894 | 903 | try: |
|
895 | 904 | self.entries.remove(fn) |
|
896 | 905 | self._dirty = True |
|
897 | 906 | except KeyError: |
|
898 | 907 | pass |
|
899 | 908 | |
|
900 | 909 | def __contains__(self, fn): |
|
901 | 910 | if fn in self.addls: |
|
902 | 911 | return True |
|
903 | 912 | if self.entries is None: |
|
904 | 913 | self._load() |
|
905 | 914 | return fn in self.entries |
|
906 | 915 | |
|
907 | 916 | def __iter__(self): |
|
908 | 917 | if self.entries is None: |
|
909 | 918 | self._load() |
|
910 | 919 | return iter(self.entries | self.addls) |
|
911 | 920 | |
|
912 | 921 | |
|
913 | 922 | class _fncachevfs(vfsmod.proxyvfs): |
|
914 | 923 | def __init__(self, vfs, fnc, encode): |
|
915 | 924 | vfsmod.proxyvfs.__init__(self, vfs) |
|
916 | 925 | self.fncache = fnc |
|
917 | 926 | self.encode = encode |
|
918 | 927 | |
|
919 | 928 | def __call__(self, path, mode=b'r', *args, **kw): |
|
920 | 929 | encoded = self.encode(path) |
|
921 | 930 | if ( |
|
922 | 931 | mode not in (b'r', b'rb') |
|
923 | 932 | and (path.startswith(b'data/') or path.startswith(b'meta/')) |
|
924 | 933 | and revlog_type(path) is not None |
|
925 | 934 | ): |
|
926 | 935 | # do not trigger a fncache load when adding a file that already is |
|
927 | 936 | # known to exist. |
|
928 | 937 | notload = self.fncache.entries is None and self.vfs.exists(encoded) |
|
929 | 938 | if notload and b'r+' in mode and not self.vfs.stat(encoded).st_size: |
|
930 | 939 | # when appending to an existing file, if the file has size zero, |
|
931 | 940 | # it should be considered as missing. Such zero-size files are |
|
932 | 941 | # the result of truncation when a transaction is aborted. |
|
933 | 942 | notload = False |
|
934 | 943 | if not notload: |
|
935 | 944 | self.fncache.add(path) |
|
936 | 945 | return self.vfs(encoded, mode, *args, **kw) |
|
937 | 946 | |
|
938 | 947 | def join(self, path): |
|
939 | 948 | if path: |
|
940 | 949 | return self.vfs.join(self.encode(path)) |
|
941 | 950 | else: |
|
942 | 951 | return self.vfs.join(path) |
|
943 | 952 | |
|
944 | 953 | def register_file(self, path): |
|
945 | 954 | """generic hook point to lets fncache steer its stew""" |
|
946 | 955 | if path.startswith(b'data/') or path.startswith(b'meta/'): |
|
947 | 956 | self.fncache.add(path) |
|
948 | 957 | |
|
949 | 958 | |
|
950 | 959 | class fncachestore(basicstore): |
|
951 | 960 | def __init__(self, path, vfstype, dotencode): |
|
952 | 961 | if dotencode: |
|
953 | 962 | encode = _pathencode |
|
954 | 963 | else: |
|
955 | 964 | encode = _plainhybridencode |
|
956 | 965 | self.encode = encode |
|
957 | 966 | vfs = vfstype(path + b'/store') |
|
958 | 967 | self.path = vfs.base |
|
959 | 968 | self.pathsep = self.path + b'/' |
|
960 | 969 | self.createmode = _calcmode(vfs) |
|
961 | 970 | vfs.createmode = self.createmode |
|
962 | 971 | self.rawvfs = vfs |
|
963 | 972 | fnc = fncache(vfs) |
|
964 | 973 | self.fncache = fnc |
|
965 | 974 | self.vfs = _fncachevfs(vfs, fnc, encode) |
|
966 | 975 | self.opener = self.vfs |
|
967 | 976 | |
|
968 | 977 | def join(self, f): |
|
969 | 978 | return self.pathsep + self.encode(f) |
|
970 | 979 | |
|
971 | 980 | def getsize(self, path): |
|
972 | 981 | return self.rawvfs.stat(path).st_size |
|
973 | 982 | |
|
974 | 983 | def datafiles( |
|
975 | 984 | self, matcher=None, undecodable=None |
|
976 | 985 | ) -> Generator[BaseStoreEntry, None, None]: |
|
977 | 986 | files = ((f, revlog_type(f)) for f in self.fncache) |
|
978 | 987 | # Note: all files in fncache should be revlog related; however, the
|
979 | 988 | # fncache might contain such files added by previous versions of
|
980 | 989 | # Mercurial. |
|
981 | 990 | files = (f for f in files if f[1] is not None) |
|
982 | 991 | by_revlog = _gather_revlog(files) |
|
983 | 992 | for revlog, details in by_revlog: |
|
993 | file_details = {} | |
|
984 | 994 | if revlog.startswith(b'data/'): |
|
985 | 995 | rl_type = FILEFLAGS_FILELOG |
|
986 | 996 | revlog_target_id = revlog.split(b'/', 1)[1] |
|
987 | 997 | elif revlog.startswith(b'meta/'): |
|
988 | 998 | rl_type = FILEFLAGS_MANIFESTLOG |
|
989 | 999 | # drop the initial directory and the `00manifest` file part |
|
990 | 1000 | tmp = revlog.split(b'/', 1)[1] |
|
991 | 1001 | revlog_target_id = tmp.rsplit(b'/', 1)[0] + b'/' |
|
992 | 1002 | else: |
|
993 | 1003 | # unreachable |
|
994 | 1004 | assert False, revlog |
|
995 |
for ext, t in |
|
|
996 | f = revlog + ext | |
|
1005 | for ext, t in details.items(): | |
|
1006 | file_details[ext] = { | |
|
1007 | 'is_volatile': bool(t & FILEFLAGS_VOLATILE), | |
|
1008 | } | |
|
997 | 1009 |
|
|
998 |
|
|
|
1010 | path_prefix=revlog, | |
|
999 | 1011 |
|
|
1000 | 1012 |
|
|
1001 | is_revlog_main=bool(t & FILEFLAGS_REVLOG_MAIN), | |
|
1002 | is_volatile=bool(t & FILEFLAGS_VOLATILE), | |
|
1013 | details=file_details, | |
|
1003 | 1014 |
|
|
1004 | 1015 |
|
|
1005 | 1016 |
|
|
1006 | 1017 | |
|
1007 | 1018 | def copylist(self): |
|
1008 | 1019 | d = ( |
|
1009 | 1020 | b'bookmarks', |
|
1010 | 1021 | b'narrowspec', |
|
1011 | 1022 | b'data', |
|
1012 | 1023 | b'meta', |
|
1013 | 1024 | b'dh', |
|
1014 | 1025 | b'fncache', |
|
1015 | 1026 | b'phaseroots', |
|
1016 | 1027 | b'obsstore', |
|
1017 | 1028 | b'00manifest.d', |
|
1018 | 1029 | b'00manifest.i', |
|
1019 | 1030 | b'00changelog.d', |
|
1020 | 1031 | b'00changelog.i', |
|
1021 | 1032 | b'requires', |
|
1022 | 1033 | ) |
|
1023 | 1034 | return [b'requires', b'00changelog.i'] + [b'store/' + f for f in d] |
|
1024 | 1035 | |
|
1025 | 1036 | def write(self, tr): |
|
1026 | 1037 | self.fncache.write(tr) |
|
1027 | 1038 | |
|
1028 | 1039 | def invalidatecaches(self): |
|
1029 | 1040 | self.fncache.entries = None |
|
1030 | 1041 | self.fncache.addls = set() |
|
1031 | 1042 | |
|
1032 | 1043 | def markremoved(self, fn): |
|
1033 | 1044 | self.fncache.remove(fn) |
|
1034 | 1045 | |
|
1035 | 1046 | def _exists(self, f): |
|
1036 | 1047 | ef = self.encode(f) |
|
1037 | 1048 | try: |
|
1038 | 1049 | self.getsize(ef) |
|
1039 | 1050 | return True |
|
1040 | 1051 | except FileNotFoundError: |
|
1041 | 1052 | return False |
|
1042 | 1053 | |
|
1043 | 1054 | def __contains__(self, path): |
|
1044 | 1055 | '''Checks if the store contains path''' |
|
1045 | 1056 | path = b"/".join((b"data", path)) |
|
1046 | 1057 | # check for files (exact match) |
|
1047 | 1058 | e = path + b'.i' |
|
1048 | 1059 | if e in self.fncache and self._exists(e): |
|
1049 | 1060 | return True |
|
1050 | 1061 | # now check for directories (prefix match) |
|
1051 | 1062 | if not path.endswith(b'/'): |
|
1052 | 1063 | path += b'/' |
|
1053 | 1064 | for e in self.fncache: |
|
1054 | 1065 | if e.startswith(path) and self._exists(e): |
|
1055 | 1066 | return True |
|
1056 | 1067 | return False |
@@ -1,668 +1,668 | |||
|
1 | 1 | # upgrade.py - functions for in place upgrade of Mercurial repository |
|
2 | 2 | # |
|
3 | 3 | # Copyright (c) 2016-present, Gregory Szorc |
|
4 | 4 | # |
|
5 | 5 | # This software may be used and distributed according to the terms of the |
|
6 | 6 | # GNU General Public License version 2 or any later version. |
|
7 | 7 | |
|
8 | 8 | |
|
9 | 9 | import stat |
|
10 | 10 | |
|
11 | 11 | from ..i18n import _ |
|
12 | 12 | from ..pycompat import getattr |
|
13 | 13 | from .. import ( |
|
14 | 14 | changelog, |
|
15 | 15 | error, |
|
16 | 16 | filelog, |
|
17 | 17 | manifest, |
|
18 | 18 | metadata, |
|
19 | 19 | pycompat, |
|
20 | 20 | requirements, |
|
21 | 21 | scmutil, |
|
22 | 22 | store, |
|
23 | 23 | util, |
|
24 | 24 | vfs as vfsmod, |
|
25 | 25 | ) |
|
26 | 26 | from ..revlogutils import ( |
|
27 | 27 | constants as revlogconst, |
|
28 | 28 | flagutil, |
|
29 | 29 | nodemap, |
|
30 | 30 | sidedata as sidedatamod, |
|
31 | 31 | ) |
|
32 | 32 | from . import actions as upgrade_actions |
|
33 | 33 | |
|
34 | 34 | |
|
35 | 35 | def get_sidedata_helpers(srcrepo, dstrepo): |
|
36 | 36 | use_w = srcrepo.ui.configbool(b'experimental', b'worker.repository-upgrade') |
|
37 | 37 | sequential = pycompat.iswindows or not use_w |
|
38 | 38 | if not sequential: |
|
39 | 39 | srcrepo.register_sidedata_computer( |
|
40 | 40 | revlogconst.KIND_CHANGELOG, |
|
41 | 41 | sidedatamod.SD_FILES, |
|
42 | 42 | (sidedatamod.SD_FILES,), |
|
43 | 43 | metadata._get_worker_sidedata_adder(srcrepo, dstrepo), |
|
44 | 44 | flagutil.REVIDX_HASCOPIESINFO, |
|
45 | 45 | replace=True, |
|
46 | 46 | ) |
|
47 | 47 | return sidedatamod.get_sidedata_helpers(srcrepo, dstrepo._wanted_sidedata) |
|
48 | 48 | |
|
49 | 49 | |
|
50 | 50 | def _revlog_from_store_entry(repo, entry): |
|
51 | 51 | """Obtain a revlog from a repo store entry. |
|
52 | 52 | |
|
53 | 53 | An instance of the appropriate class is returned. |
|
54 | 54 | """ |
|
55 | 55 | if entry.revlog_type == store.FILEFLAGS_CHANGELOG: |
|
56 | 56 | return changelog.changelog(repo.svfs) |
|
57 | 57 | elif entry.revlog_type == store.FILEFLAGS_MANIFESTLOG: |
|
58 | 58 | mandir = entry.target_id.rstrip(b'/') |
|
59 | 59 | return manifest.manifestrevlog( |
|
60 | 60 | repo.nodeconstants, repo.svfs, tree=mandir |
|
61 | 61 | ) |
|
62 | 62 | else: |
|
63 | 63 | return filelog.filelog(repo.svfs, entry.target_id) |
|
64 | 64 | |
|
65 | 65 | |
|
66 | 66 | def _copyrevlog(tr, destrepo, oldrl, entry): |
|
67 | 67 | """copy all relevant files for `oldrl` into `destrepo` store |
|
68 | 68 | |
|
69 | 69 | Files are copied "as is" without any transformation. The copy is performed |
|
70 | 70 | without extra checks. Callers are responsible for making sure the copied |
|
71 | 71 | content is compatible with format of the destination repository. |
|
72 | 72 | """ |
|
73 | 73 | oldrl = getattr(oldrl, '_revlog', oldrl) |
|
74 | 74 | newrl = _revlog_from_store_entry(destrepo, entry) |
|
75 | 75 | newrl = getattr(newrl, '_revlog', newrl) |
|
76 | 76 | |
|
77 | 77 | oldvfs = oldrl.opener |
|
78 | 78 | newvfs = newrl.opener |
|
79 | 79 | oldindex = oldvfs.join(oldrl._indexfile) |
|
80 | 80 | newindex = newvfs.join(newrl._indexfile) |
|
81 | 81 | olddata = oldvfs.join(oldrl._datafile) |
|
82 | 82 | newdata = newvfs.join(newrl._datafile) |
|
83 | 83 | |
|
84 | 84 | with newvfs(newrl._indexfile, b'w'): |
|
85 | 85 | pass # create all the directories |
|
86 | 86 | |
|
87 | 87 | util.copyfile(oldindex, newindex) |
|
88 | 88 | copydata = oldrl.opener.exists(oldrl._datafile) |
|
89 | 89 | if copydata: |
|
90 | 90 | util.copyfile(olddata, newdata) |
|
91 | 91 | |
|
92 | 92 | if entry.revlog_type & store.FILEFLAGS_FILELOG: |
|
93 | 93 | unencodedname = entry.main_file_path() |
|
94 | 94 | destrepo.svfs.fncache.add(unencodedname) |
|
95 | 95 | if copydata: |
|
96 | 96 | destrepo.svfs.fncache.add(unencodedname[:-2] + b'.d') |
|
97 | 97 | |
|
98 | 98 | |
|
99 | 99 | UPGRADE_CHANGELOG = b"changelog" |
|
100 | 100 | UPGRADE_MANIFEST = b"manifest" |
|
101 | 101 | UPGRADE_FILELOGS = b"all-filelogs" |
|
102 | 102 | |
|
103 | 103 | UPGRADE_ALL_REVLOGS = frozenset( |
|
104 | 104 | [UPGRADE_CHANGELOG, UPGRADE_MANIFEST, UPGRADE_FILELOGS] |
|
105 | 105 | ) |
|
106 | 106 | |
|
107 | 107 | |
|
108 | 108 | def matchrevlog(revlogfilter, rl_type): |
|
109 | 109 | """check if a revlog is selected for cloning. |
|
110 | 110 | |
|
111 | 111 | In other words, are there any updates which need to be done on the revlog,
|
112 | 112 | or can it be blindly copied?
|
113 | 113 | |
|
114 | 114 | The store entry is checked against the passed filter""" |
|
115 | 115 | if rl_type & store.FILEFLAGS_CHANGELOG: |
|
116 | 116 | return UPGRADE_CHANGELOG in revlogfilter |
|
117 | 117 | elif rl_type & store.FILEFLAGS_MANIFESTLOG: |
|
118 | 118 | return UPGRADE_MANIFEST in revlogfilter |
|
119 | 119 | assert rl_type & store.FILEFLAGS_FILELOG |
|
120 | 120 | return UPGRADE_FILELOGS in revlogfilter |
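A rough usage sketch; the import path is an assumption (this file is assumed to live at mercurial/upgrade_utils/engine.py) and the values are invented for illustration:

    from mercurial import store
    from mercurial.upgrade_utils.engine import (
        UPGRADE_ALL_REVLOGS,
        UPGRADE_CHANGELOG,
        matchrevlog,
    )

    assert matchrevlog(UPGRADE_ALL_REVLOGS, store.FILETYPE_FILELOG_MAIN)
    assert not matchrevlog(frozenset([UPGRADE_CHANGELOG]), store.FILETYPE_FILELOG_MAIN)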
|
121 | 121 | |
|
122 | 122 | |
|
123 | 123 | def _perform_clone( |
|
124 | 124 | ui, |
|
125 | 125 | dstrepo, |
|
126 | 126 | tr, |
|
127 | 127 | old_revlog, |
|
128 | 128 | entry, |
|
129 | 129 | upgrade_op, |
|
130 | 130 | sidedata_helpers, |
|
131 | 131 | oncopiedrevision, |
|
132 | 132 | ): |
|
133 | 133 | """returns the new revlog object created""" |
|
134 | 134 | newrl = None |
|
135 | 135 | revlog_path = entry.main_file_path() |
|
136 | 136 | if matchrevlog(upgrade_op.revlogs_to_process, entry.revlog_type): |
|
137 | 137 | ui.note( |
|
138 | 138 | _(b'cloning %d revisions from %s\n') |
|
139 | 139 | % (len(old_revlog), revlog_path) |
|
140 | 140 | ) |
|
141 | 141 | newrl = _revlog_from_store_entry(dstrepo, entry) |
|
142 | 142 | old_revlog.clone( |
|
143 | 143 | tr, |
|
144 | 144 | newrl, |
|
145 | 145 | addrevisioncb=oncopiedrevision, |
|
146 | 146 | deltareuse=upgrade_op.delta_reuse_mode, |
|
147 | 147 | forcedeltabothparents=upgrade_op.force_re_delta_both_parents, |
|
148 | 148 | sidedata_helpers=sidedata_helpers, |
|
149 | 149 | ) |
|
150 | 150 | else: |
|
151 | 151 | msg = _(b'blindly copying %s containing %i revisions\n') |
|
152 | 152 | ui.note(msg % (revlog_path, len(old_revlog))) |
|
153 | 153 | _copyrevlog(tr, dstrepo, old_revlog, entry) |
|
154 | 154 | |
|
155 | 155 | newrl = _revlog_from_store_entry(dstrepo, entry) |
|
156 | 156 | return newrl |
|
157 | 157 | |
|
158 | 158 | |
|
159 | 159 | def _clonerevlogs( |
|
160 | 160 | ui, |
|
161 | 161 | srcrepo, |
|
162 | 162 | dstrepo, |
|
163 | 163 | tr, |
|
164 | 164 | upgrade_op, |
|
165 | 165 | ): |
|
166 | 166 | """Copy revlogs between 2 repos.""" |
|
167 | 167 | revcount = 0 |
|
168 | 168 | srcsize = 0 |
|
169 | 169 | srcrawsize = 0 |
|
170 | 170 | dstsize = 0 |
|
171 | 171 | fcount = 0 |
|
172 | 172 | frevcount = 0 |
|
173 | 173 | fsrcsize = 0 |
|
174 | 174 | frawsize = 0 |
|
175 | 175 | fdstsize = 0 |
|
176 | 176 | mcount = 0 |
|
177 | 177 | mrevcount = 0 |
|
178 | 178 | msrcsize = 0 |
|
179 | 179 | mrawsize = 0 |
|
180 | 180 | mdstsize = 0 |
|
181 | 181 | crevcount = 0 |
|
182 | 182 | csrcsize = 0 |
|
183 | 183 | crawsize = 0 |
|
184 | 184 | cdstsize = 0 |
|
185 | 185 | |
|
186 | 186 | alldatafiles = list(srcrepo.store.walk()) |
|
187 | 187 | # mapping of data files which needs to be cloned |
|
188 | 188 | # key is unencoded filename |
|
189 | 189 | # value is revlog_object_from_srcrepo |
|
190 | 190 | manifests = {} |
|
191 | 191 | changelogs = {} |
|
192 | 192 | filelogs = {} |
|
193 | 193 | |
|
194 | 194 | # Perform a pass to collect metadata. This validates we can open all |
|
195 | 195 | # source files and allows a unified progress bar to be displayed. |
|
196 | 196 | for entry in alldatafiles: |
|
197 |
if not |
|
|
197 | if not entry.is_revlog: | |
|
198 | 198 | continue |
|
199 | 199 | |
|
200 | 200 | rl = _revlog_from_store_entry(srcrepo, entry) |
|
201 | 201 | |
|
202 | 202 | info = rl.storageinfo( |
|
203 | 203 | exclusivefiles=True, |
|
204 | 204 | revisionscount=True, |
|
205 | 205 | trackedsize=True, |
|
206 | 206 | storedsize=True, |
|
207 | 207 | ) |
|
208 | 208 | |
|
209 | 209 | revcount += info[b'revisionscount'] or 0 |
|
210 | 210 | datasize = info[b'storedsize'] or 0 |
|
211 | 211 | rawsize = info[b'trackedsize'] or 0 |
|
212 | 212 | |
|
213 | 213 | srcsize += datasize |
|
214 | 214 | srcrawsize += rawsize |
|
215 | 215 | |
|
216 | 216 | # This is for the separate progress bars. |
|
217 | 217 | if entry.revlog_type & store.FILEFLAGS_CHANGELOG: |
|
218 | 218 | changelogs[entry.target_id] = entry |
|
219 | 219 | crevcount += len(rl) |
|
220 | 220 | csrcsize += datasize |
|
221 | 221 | crawsize += rawsize |
|
222 | 222 | elif entry.revlog_type & store.FILEFLAGS_MANIFESTLOG: |
|
223 | 223 | manifests[entry.target_id] = entry |
|
224 | 224 | mcount += 1 |
|
225 | 225 | mrevcount += len(rl) |
|
226 | 226 | msrcsize += datasize |
|
227 | 227 | mrawsize += rawsize |
|
228 | 228 | elif entry.revlog_type & store.FILEFLAGS_FILELOG: |
|
229 | 229 | filelogs[entry.target_id] = entry |
|
230 | 230 | fcount += 1 |
|
231 | 231 | frevcount += len(rl) |
|
232 | 232 | fsrcsize += datasize |
|
233 | 233 | frawsize += rawsize |
|
234 | 234 | else: |
|
235 | 235 | error.ProgrammingError(b'unknown revlog type') |
|
236 | 236 | |
|
237 | 237 | if not revcount: |
|
238 | 238 | return |
|
239 | 239 | |
|
240 | 240 | ui.status( |
|
241 | 241 | _( |
|
242 | 242 | b'migrating %d total revisions (%d in filelogs, %d in manifests, ' |
|
243 | 243 | b'%d in changelog)\n' |
|
244 | 244 | ) |
|
245 | 245 | % (revcount, frevcount, mrevcount, crevcount) |
|
246 | 246 | ) |
|
247 | 247 | ui.status( |
|
248 | 248 | _(b'migrating %s in store; %s tracked data\n') |
|
249 | 249 | % ((util.bytecount(srcsize), util.bytecount(srcrawsize))) |
|
250 | 250 | ) |
|
251 | 251 | |
|
252 | 252 | # Used to keep track of progress. |
|
253 | 253 | progress = None |
|
254 | 254 | |
|
255 | 255 | def oncopiedrevision(rl, rev, node): |
|
256 | 256 | progress.increment() |
|
257 | 257 | |
|
258 | 258 | sidedata_helpers = get_sidedata_helpers(srcrepo, dstrepo) |
|
259 | 259 | |
|
260 | 260 | # Migrating filelogs |
|
261 | 261 | ui.status( |
|
262 | 262 | _( |
|
263 | 263 | b'migrating %d filelogs containing %d revisions ' |
|
264 | 264 | b'(%s in store; %s tracked data)\n' |
|
265 | 265 | ) |
|
266 | 266 | % ( |
|
267 | 267 | fcount, |
|
268 | 268 | frevcount, |
|
269 | 269 | util.bytecount(fsrcsize), |
|
270 | 270 | util.bytecount(frawsize), |
|
271 | 271 | ) |
|
272 | 272 | ) |
|
273 | 273 | progress = srcrepo.ui.makeprogress(_(b'file revisions'), total=frevcount) |
|
274 | 274 | for target_id, entry in sorted(filelogs.items()): |
|
275 | 275 | oldrl = _revlog_from_store_entry(srcrepo, entry) |
|
276 | 276 | |
|
277 | 277 | newrl = _perform_clone( |
|
278 | 278 | ui, |
|
279 | 279 | dstrepo, |
|
280 | 280 | tr, |
|
281 | 281 | oldrl, |
|
282 | 282 | entry, |
|
283 | 283 | upgrade_op, |
|
284 | 284 | sidedata_helpers, |
|
285 | 285 | oncopiedrevision, |
|
286 | 286 | ) |
|
287 | 287 | info = newrl.storageinfo(storedsize=True) |
|
288 | 288 | fdstsize += info[b'storedsize'] or 0 |
|
289 | 289 | ui.status( |
|
290 | 290 | _( |
|
291 | 291 | b'finished migrating %d filelog revisions across %d ' |
|
292 | 292 | b'filelogs; change in size: %s\n' |
|
293 | 293 | ) |
|
294 | 294 | % (frevcount, fcount, util.bytecount(fdstsize - fsrcsize)) |
|
295 | 295 | ) |
|
296 | 296 | |
|
297 | 297 | # Migrating manifests |
|
298 | 298 | ui.status( |
|
299 | 299 | _( |
|
300 | 300 | b'migrating %d manifests containing %d revisions ' |
|
301 | 301 | b'(%s in store; %s tracked data)\n' |
|
302 | 302 | ) |
|
303 | 303 | % ( |
|
304 | 304 | mcount, |
|
305 | 305 | mrevcount, |
|
306 | 306 | util.bytecount(msrcsize), |
|
307 | 307 | util.bytecount(mrawsize), |
|
308 | 308 | ) |
|
309 | 309 | ) |
|
310 | 310 | if progress: |
|
311 | 311 | progress.complete() |
|
312 | 312 | progress = srcrepo.ui.makeprogress( |
|
313 | 313 | _(b'manifest revisions'), total=mrevcount |
|
314 | 314 | ) |
|
315 | 315 | for target_id, entry in sorted(manifests.items()): |
|
316 | 316 | oldrl = _revlog_from_store_entry(srcrepo, entry) |
|
317 | 317 | newrl = _perform_clone( |
|
318 | 318 | ui, |
|
319 | 319 | dstrepo, |
|
320 | 320 | tr, |
|
321 | 321 | oldrl, |
|
322 | 322 | entry, |
|
323 | 323 | upgrade_op, |
|
324 | 324 | sidedata_helpers, |
|
325 | 325 | oncopiedrevision, |
|
326 | 326 | ) |
|
327 | 327 | info = newrl.storageinfo(storedsize=True) |
|
328 | 328 | mdstsize += info[b'storedsize'] or 0 |
|
329 | 329 | ui.status( |
|
330 | 330 | _( |
|
331 | 331 | b'finished migrating %d manifest revisions across %d ' |
|
332 | 332 | b'manifests; change in size: %s\n' |
|
333 | 333 | ) |
|
334 | 334 | % (mrevcount, mcount, util.bytecount(mdstsize - msrcsize)) |
|
335 | 335 | ) |
|
336 | 336 | |
|
337 | 337 | # Migrating changelog |
|
338 | 338 | ui.status( |
|
339 | 339 | _( |
|
340 | 340 | b'migrating changelog containing %d revisions ' |
|
341 | 341 | b'(%s in store; %s tracked data)\n' |
|
342 | 342 | ) |
|
343 | 343 | % ( |
|
344 | 344 | crevcount, |
|
345 | 345 | util.bytecount(csrcsize), |
|
346 | 346 | util.bytecount(crawsize), |
|
347 | 347 | ) |
|
348 | 348 | ) |
|
349 | 349 | if progress: |
|
350 | 350 | progress.complete() |
|
351 | 351 | progress = srcrepo.ui.makeprogress( |
|
352 | 352 | _(b'changelog revisions'), total=crevcount |
|
353 | 353 | ) |
|
354 | 354 | for target_id, entry in sorted(changelogs.items()): |
|
355 | 355 | oldrl = _revlog_from_store_entry(srcrepo, entry) |
|
356 | 356 | newrl = _perform_clone( |
|
357 | 357 | ui, |
|
358 | 358 | dstrepo, |
|
359 | 359 | tr, |
|
360 | 360 | oldrl, |
|
361 | 361 | entry, |
|
362 | 362 | upgrade_op, |
|
363 | 363 | sidedata_helpers, |
|
364 | 364 | oncopiedrevision, |
|
365 | 365 | ) |
|
366 | 366 | info = newrl.storageinfo(storedsize=True) |
|
367 | 367 | cdstsize += info[b'storedsize'] or 0 |
|
368 | 368 | progress.complete() |
|
369 | 369 | ui.status( |
|
370 | 370 | _( |
|
371 | 371 | b'finished migrating %d changelog revisions; change in size: ' |
|
372 | 372 | b'%s\n' |
|
373 | 373 | ) |
|
374 | 374 | % (crevcount, util.bytecount(cdstsize - csrcsize)) |
|
375 | 375 | ) |
|
376 | 376 | |
|
377 | 377 | dstsize = fdstsize + mdstsize + cdstsize |
|
378 | 378 | ui.status( |
|
379 | 379 | _( |
|
380 | 380 | b'finished migrating %d total revisions; total change in store ' |
|
381 | 381 | b'size: %s\n' |
|
382 | 382 | ) |
|
383 | 383 | % (revcount, util.bytecount(dstsize - srcsize)) |
|
384 | 384 | ) |
|
385 | 385 | |
|
386 | 386 | |
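
Editor's note: a minimal sketch (not part of the diff) of the metadata-collection pattern used at the top of _clonerevlogs above; it assumes this module's existing imports (util, _) and the private helper _revlog_from_store_entry shown in the diff, and the helper name _summarize_store is hypothetical.

def _summarize_store(srcrepo, ui):
    # Walk every revlog in the source store and total up revision count,
    # stored size, and raw tracked size, as the migration pass above does.
    revcount = srcsize = srcrawsize = 0
    for entry in srcrepo.store.walk():
        if not entry.is_revlog:
            continue
        rl = _revlog_from_store_entry(srcrepo, entry)
        info = rl.storageinfo(
            revisionscount=True, trackedsize=True, storedsize=True
        )
        revcount += info[b'revisionscount'] or 0
        srcsize += info[b'storedsize'] or 0
        srcrawsize += info[b'trackedsize'] or 0
    ui.status(
        _(b'%d revisions; %s in store; %s tracked data\n')
        % (revcount, util.bytecount(srcsize), util.bytecount(srcrawsize))
    )
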
|
387 | 387 | def _files_to_copy_post_revlog_clone(srcrepo): |
|
388 | 388 | """yields files which should be copied to destination after revlogs |
|
389 | 389 | are cloned""" |
|
390 | 390 | for path, kind, st in sorted(srcrepo.store.vfs.readdir(b'', stat=True)): |
|
391 | 391 | # don't copy revlogs as they are already cloned |
|
392 | 392 | if store.revlog_type(path) is not None: |
|
393 | 393 | continue |
|
394 | 394 | # Skip transaction related files. |
|
395 | 395 | if path.startswith(b'undo'): |
|
396 | 396 | continue |
|
397 | 397 | # Only copy regular files. |
|
398 | 398 | if kind != stat.S_IFREG: |
|
399 | 399 | continue |
|
400 | 400 | # Skip other skipped files. |
|
401 | 401 | if path in (b'lock', b'fncache'): |
|
402 | 402 | continue |
|
403 | 403 | # TODO: should we skip cache too? |
|
404 | 404 | |
|
405 | 405 | yield path |
|
406 | 406 | |
|
407 | 407 | |
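
Editor's note: a hedged usage sketch for the generator above; it mirrors the copy loop that upgrade() performs further down in this file and assumes srcrepo/dstrepo objects with the usual store.rawvfs attribute.

# Copy every non-revlog store file that the generator yields.
for p in _files_to_copy_post_revlog_clone(srcrepo):
    src = srcrepo.store.rawvfs.join(p)
    dst = dstrepo.store.rawvfs.join(p)
    util.copyfile(src, dst, copystat=True)
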
|
408 | 408 | def _replacestores(currentrepo, upgradedrepo, backupvfs, upgrade_op): |
|
409 | 409 | """Replace the stores after current repository is upgraded |
|
410 | 410 | |
|
411 | 411 | Creates a backup of the current repository store at the backup path

412 | 412 | Replaces the store files in the current repo with those from the upgraded one
|
413 | 413 | |
|
414 | 414 | Arguments: |
|
415 | 415 | currentrepo: repo object of current repository |
|
416 | 416 | upgradedrepo: repo object of the upgraded data |
|
417 | 417 | backupvfs: vfs object for the backup path |
|
418 | 418 | upgrade_op: upgrade operation object

419 | 419 | used to decide which parts of the store are upgraded
|
420 | 420 | """ |
|
421 | 421 | # TODO: don't blindly rename everything in store |
|
422 | 422 | # There can be upgrades where store is not touched at all |
|
423 | 423 | if upgrade_op.backup_store: |
|
424 | 424 | util.rename(currentrepo.spath, backupvfs.join(b'store')) |
|
425 | 425 | else: |
|
426 | 426 | currentrepo.vfs.rmtree(b'store', forcibly=True) |
|
427 | 427 | util.rename(upgradedrepo.spath, currentrepo.spath) |
|
428 | 428 | |
|
429 | 429 | |
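
Editor's note: a minimal calling sketch for _replacestores, assuming the same temporary 'upgradebackup.' directory that upgrade() creates below (pycompat and vfsmod are imported elsewhere in this module).

# Prepare a backup location inside .hg, then swap the upgraded store in.
backuppath = pycompat.mkdtemp(prefix=b'upgradebackup.', dir=srcrepo.path)
backupvfs = vfsmod.vfs(backuppath)
_replacestores(srcrepo, dstrepo, backupvfs, upgrade_op)
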
|
430 | 430 | def finishdatamigration(ui, srcrepo, dstrepo, requirements): |
|
431 | 431 | """Hook point for extensions to perform additional actions during upgrade. |
|
432 | 432 | |
|
433 | 433 | This function is called after revlogs and store files have been copied but |
|
434 | 434 | before the new store is swapped into the original location. |
|
435 | 435 | """ |
|
436 | 436 | |
|
437 | 437 | |
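
Editor's note: a hypothetical extension sketch for this hook point. It assumes the standard mercurial.extensions.wrapfunction API and an import path for this module; both the path and the extension name are illustrative, not taken from the diff.

from mercurial import extensions
from mercurial.upgrade_utils import engine  # hypothetical import path


def _finishdatamigration(orig, ui, srcrepo, dstrepo, requirements):
    # Run the original hook first, then do extension-specific work while the
    # upgraded store is still in its temporary location.
    orig(ui, srcrepo, dstrepo, requirements)
    ui.status(b'myext: running post-migration step\n')


def uisetup(ui):
    extensions.wrapfunction(engine, 'finishdatamigration', _finishdatamigration)
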
|
438 | 438 | def upgrade(ui, srcrepo, dstrepo, upgrade_op): |
|
439 | 439 | """Do the low-level work of upgrading a repository. |
|
440 | 440 | |
|
441 | 441 | The upgrade is effectively performed as a copy between a source |
|
442 | 442 | repository and a temporary destination repository. |
|
443 | 443 | |
|
444 | 444 | The source repository is unmodified for as long as possible so the |
|
445 | 445 | upgrade can abort at any time without causing loss of service for |
|
446 | 446 | readers and without corrupting the source repository. |
|
447 | 447 | """ |
|
448 | 448 | assert srcrepo.currentwlock() |
|
449 | 449 | assert dstrepo.currentwlock() |
|
450 | 450 | backuppath = None |
|
451 | 451 | backupvfs = None |
|
452 | 452 | |
|
453 | 453 | ui.status( |
|
454 | 454 | _( |
|
455 | 455 | b'(it is safe to interrupt this process any time before ' |
|
456 | 456 | b'data migration completes)\n' |
|
457 | 457 | ) |
|
458 | 458 | ) |
|
459 | 459 | |
|
460 | 460 | if upgrade_actions.dirstatev2 in upgrade_op.upgrade_actions: |
|
461 | 461 | ui.status(_(b'upgrading to dirstate-v2 from v1\n')) |
|
462 | 462 | upgrade_dirstate(ui, srcrepo, upgrade_op, b'v1', b'v2') |
|
463 | 463 | upgrade_op.upgrade_actions.remove(upgrade_actions.dirstatev2) |
|
464 | 464 | |
|
465 | 465 | if upgrade_actions.dirstatev2 in upgrade_op.removed_actions: |
|
466 | 466 | ui.status(_(b'downgrading from dirstate-v2 to v1\n')) |
|
467 | 467 | upgrade_dirstate(ui, srcrepo, upgrade_op, b'v2', b'v1') |
|
468 | 468 | upgrade_op.removed_actions.remove(upgrade_actions.dirstatev2) |
|
469 | 469 | |
|
470 | 470 | if upgrade_actions.dirstatetrackedkey in upgrade_op.upgrade_actions: |
|
471 | 471 | ui.status(_(b'create dirstate-tracked-hint file\n')) |
|
472 | 472 | upgrade_tracked_hint(ui, srcrepo, upgrade_op, add=True) |
|
473 | 473 | upgrade_op.upgrade_actions.remove(upgrade_actions.dirstatetrackedkey) |
|
474 | 474 | elif upgrade_actions.dirstatetrackedkey in upgrade_op.removed_actions: |
|
475 | 475 | ui.status(_(b'remove dirstate-tracked-hint file\n')) |
|
476 | 476 | upgrade_tracked_hint(ui, srcrepo, upgrade_op, add=False) |
|
477 | 477 | upgrade_op.removed_actions.remove(upgrade_actions.dirstatetrackedkey) |
|
478 | 478 | |
|
479 | 479 | if not (upgrade_op.upgrade_actions or upgrade_op.removed_actions): |
|
480 | 480 | return |
|
481 | 481 | |
|
482 | 482 | if upgrade_op.requirements_only: |
|
483 | 483 | ui.status(_(b'upgrading repository requirements\n')) |
|
484 | 484 | scmutil.writereporequirements(srcrepo, upgrade_op.new_requirements) |
|
485 | 485 | # if there is only one action and that is the persistent nodemap upgrade,

486 | 486 | # directly write the nodemap file and update requirements instead of going

487 | 487 | # through the whole cloning process
|
488 | 488 | elif ( |
|
489 | 489 | len(upgrade_op.upgrade_actions) == 1 |
|
490 | 490 | and b'persistent-nodemap' in upgrade_op.upgrade_actions_names |
|
491 | 491 | and not upgrade_op.removed_actions |
|
492 | 492 | ): |
|
493 | 493 | ui.status( |
|
494 | 494 | _(b'upgrading repository to use persistent nodemap feature\n') |
|
495 | 495 | ) |
|
496 | 496 | with srcrepo.transaction(b'upgrade') as tr: |
|
497 | 497 | unfi = srcrepo.unfiltered() |
|
498 | 498 | cl = unfi.changelog |
|
499 | 499 | nodemap.persist_nodemap(tr, cl, force=True) |
|
500 | 500 | # we want to operate directly on the underlying revlog to force
501 | 501 | # creation of a nodemap file. This is fine since this is upgrade code,
502 | 502 | # which heavily relies on the repository being revlog based,
503 | 503 | # so accessing private attributes is justified
|
504 | 504 | nodemap.persist_nodemap( |
|
505 | 505 | tr, unfi.manifestlog._rootstore._revlog, force=True |
|
506 | 506 | ) |
|
507 | 507 | scmutil.writereporequirements(srcrepo, upgrade_op.new_requirements) |
|
508 | 508 | elif ( |
|
509 | 509 | len(upgrade_op.removed_actions) == 1 |
|
510 | 510 | and [ |
|
511 | 511 | x |
|
512 | 512 | for x in upgrade_op.removed_actions |
|
513 | 513 | if x.name == b'persistent-nodemap' |
|
514 | 514 | ] |
|
515 | 515 | and not upgrade_op.upgrade_actions |
|
516 | 516 | ): |
|
517 | 517 | ui.status( |
|
518 | 518 | _(b'downgrading repository to not use persistent nodemap feature\n') |
|
519 | 519 | ) |
|
520 | 520 | with srcrepo.transaction(b'upgrade') as tr: |
|
521 | 521 | unfi = srcrepo.unfiltered() |
|
522 | 522 | cl = unfi.changelog |
|
523 | 523 | nodemap.delete_nodemap(tr, srcrepo, cl) |
|
524 | 524 | # check comment 20 lines above for accessing private attributes |
|
525 | 525 | nodemap.delete_nodemap( |
|
526 | 526 | tr, srcrepo, unfi.manifestlog._rootstore._revlog |
|
527 | 527 | ) |
|
528 | 528 | scmutil.writereporequirements(srcrepo, upgrade_op.new_requirements) |
|
529 | 529 | else: |
|
530 | 530 | with dstrepo.transaction(b'upgrade') as tr: |
|
531 | 531 | _clonerevlogs( |
|
532 | 532 | ui, |
|
533 | 533 | srcrepo, |
|
534 | 534 | dstrepo, |
|
535 | 535 | tr, |
|
536 | 536 | upgrade_op, |
|
537 | 537 | ) |
|
538 | 538 | |
|
539 | 539 | # Now copy other files in the store directory. |
|
540 | 540 | for p in _files_to_copy_post_revlog_clone(srcrepo): |
|
541 | 541 | srcrepo.ui.status(_(b'copying %s\n') % p) |
|
542 | 542 | src = srcrepo.store.rawvfs.join(p) |
|
543 | 543 | dst = dstrepo.store.rawvfs.join(p) |
|
544 | 544 | util.copyfile(src, dst, copystat=True) |
|
545 | 545 | |
|
546 | 546 | finishdatamigration(ui, srcrepo, dstrepo, requirements) |
|
547 | 547 | |
|
548 | 548 | ui.status(_(b'data fully upgraded in a temporary repository\n')) |
|
549 | 549 | |
|
550 | 550 | if upgrade_op.backup_store: |
|
551 | 551 | backuppath = pycompat.mkdtemp( |
|
552 | 552 | prefix=b'upgradebackup.', dir=srcrepo.path |
|
553 | 553 | ) |
|
554 | 554 | backupvfs = vfsmod.vfs(backuppath) |
|
555 | 555 | |
|
556 | 556 | # Make a backup of requires file first, as it is the first to be modified. |
|
557 | 557 | util.copyfile( |
|
558 | 558 | srcrepo.vfs.join(b'requires'), backupvfs.join(b'requires') |
|
559 | 559 | ) |
|
560 | 560 | |
|
561 | 561 | # We install an arbitrary requirement that clients must not support |
|
562 | 562 | # as a mechanism to lock out new clients during the data swap. This is |
|
563 | 563 | # better than allowing a client to continue while the repository is in |
|
564 | 564 | # an inconsistent state. |
|
565 | 565 | ui.status( |
|
566 | 566 | _( |
|
567 | 567 | b'marking source repository as being upgraded; clients will be ' |
|
568 | 568 | b'unable to read from repository\n' |
|
569 | 569 | ) |
|
570 | 570 | ) |
|
571 | 571 | scmutil.writereporequirements( |
|
572 | 572 | srcrepo, srcrepo.requirements | {b'upgradeinprogress'} |
|
573 | 573 | ) |
|
574 | 574 | |
|
575 | 575 | ui.status(_(b'starting in-place swap of repository data\n')) |
|
576 | 576 | if upgrade_op.backup_store: |
|
577 | 577 | ui.status( |
|
578 | 578 | _(b'replaced files will be backed up at %s\n') % backuppath |
|
579 | 579 | ) |
|
580 | 580 | |
|
581 | 581 | # Now swap in the new store directory. Doing it as a rename should make |
|
582 | 582 | # the operation nearly instantaneous and atomic (at least in well-behaved |
|
583 | 583 | # environments). |
|
584 | 584 | ui.status(_(b'replacing store...\n')) |
|
585 | 585 | tstart = util.timer() |
|
586 | 586 | _replacestores(srcrepo, dstrepo, backupvfs, upgrade_op) |
|
587 | 587 | elapsed = util.timer() - tstart |
|
588 | 588 | ui.status( |
|
589 | 589 | _( |
|
590 | 590 | b'store replacement complete; repository was inconsistent for ' |
|
591 | 591 | b'%0.1fs\n' |
|
592 | 592 | ) |
|
593 | 593 | % elapsed |
|
594 | 594 | ) |
|
595 | 595 | |
|
596 | 596 | # We first write the requirements file. Any new requirements will lock |
|
597 | 597 | # out legacy clients. |
|
598 | 598 | ui.status( |
|
599 | 599 | _( |
|
600 | 600 | b'finalizing requirements file and making repository readable ' |
|
601 | 601 | b'again\n' |
|
602 | 602 | ) |
|
603 | 603 | ) |
|
604 | 604 | scmutil.writereporequirements(srcrepo, upgrade_op.new_requirements) |
|
605 | 605 | |
|
606 | 606 | if upgrade_op.backup_store: |
|
607 | 607 | # The lock file from the old store won't be removed because nothing has a |
|
608 | 608 | # reference to its new location. So clean it up manually. Alternatively, we |
|
609 | 609 | # could update srcrepo.svfs and other variables to point to the new |
|
610 | 610 | # location. This is simpler. |
|
611 | 611 | assert backupvfs is not None # help pytype |
|
612 | 612 | backupvfs.unlink(b'store/lock') |
|
613 | 613 | |
|
614 | 614 | return backuppath |
|
615 | 615 | |
|
616 | 616 | |
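
Editor's note: a hedged sketch of the client lock-out pattern used in upgrade() above, using only calls that already appear in that function; names such as backupvfs are assumed to be set up as in that function.

# Add a requirement no client understands so readers refuse to open the
# repo while the store swap is in flight, then write the final requirements.
scmutil.writereporequirements(
    srcrepo, srcrepo.requirements | {b'upgradeinprogress'}
)
_replacestores(srcrepo, dstrepo, backupvfs, upgrade_op)
scmutil.writereporequirements(srcrepo, upgrade_op.new_requirements)
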
|
617 | 617 | def upgrade_dirstate(ui, srcrepo, upgrade_op, old, new): |
|
618 | 618 | if upgrade_op.backup_store: |
|
619 | 619 | backuppath = pycompat.mkdtemp( |
|
620 | 620 | prefix=b'upgradebackup.', dir=srcrepo.path |
|
621 | 621 | ) |
|
622 | 622 | ui.status(_(b'replaced files will be backed up at %s\n') % backuppath) |
|
623 | 623 | backupvfs = vfsmod.vfs(backuppath) |
|
624 | 624 | util.copyfile( |
|
625 | 625 | srcrepo.vfs.join(b'requires'), backupvfs.join(b'requires') |
|
626 | 626 | ) |
|
627 | 627 | try: |
|
628 | 628 | util.copyfile( |
|
629 | 629 | srcrepo.vfs.join(b'dirstate'), backupvfs.join(b'dirstate') |
|
630 | 630 | ) |
|
631 | 631 | except FileNotFoundError: |
|
632 | 632 | # The dirstate does not exist on an empty repo or a repo with no |
|
633 | 633 | # revision checked out |
|
634 | 634 | pass |
|
635 | 635 | |
|
636 | 636 | assert srcrepo.dirstate._use_dirstate_v2 == (old == b'v2') |
|
637 | 637 | use_v2 = new == b'v2' |
|
638 | 638 | if use_v2: |
|
639 | 639 | # Write the requirements *before* upgrading |
|
640 | 640 | scmutil.writereporequirements(srcrepo, upgrade_op.new_requirements) |
|
641 | 641 | |
|
642 | 642 | srcrepo.dirstate._map.preload() |
|
643 | 643 | srcrepo.dirstate._use_dirstate_v2 = use_v2 |
|
644 | 644 | srcrepo.dirstate._map._use_dirstate_v2 = use_v2 |
|
645 | 645 | srcrepo.dirstate._dirty = True |
|
646 | 646 | try: |
|
647 | 647 | srcrepo.vfs.unlink(b'dirstate') |
|
648 | 648 | except FileNotFoundError: |
|
649 | 649 | # The dirstate does not exist on an empty repo or a repo with no |
|
650 | 650 | # revision checked out |
|
651 | 651 | pass |
|
652 | 652 | |
|
653 | 653 | srcrepo.dirstate.write(None) |
|
654 | 654 | if not use_v2: |
|
655 | 655 | # Remove the v2 requirement *after* downgrading |
|
656 | 656 | scmutil.writereporequirements(srcrepo, upgrade_op.new_requirements) |
|
657 | 657 | |
|
658 | 658 | |
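
Editor's note: a compact sketch of the ordering rule encoded in upgrade_dirstate above; it assumes an upgrade_op whose new_requirements already reflect the target dirstate version.

if new == b'v2':
    # Upgrading: record the dirstate-v2 requirement before rewriting.
    scmutil.writereporequirements(srcrepo, upgrade_op.new_requirements)
    srcrepo.dirstate.write(None)
else:
    # Downgrading: rewrite the dirstate first, then drop the requirement.
    srcrepo.dirstate.write(None)
    scmutil.writereporequirements(srcrepo, upgrade_op.new_requirements)
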
|
659 | 659 | def upgrade_tracked_hint(ui, srcrepo, upgrade_op, add): |
|
660 | 660 | if add: |
|
661 | 661 | srcrepo.dirstate._use_tracked_hint = True |
|
662 | 662 | srcrepo.dirstate._dirty = True |
|
663 | 663 | srcrepo.dirstate._dirty_tracked_set = True |
|
664 | 664 | srcrepo.dirstate.write(None) |
|
665 | 665 | if not add: |
|
666 | 666 | srcrepo.dirstate.delete_tracked_hint() |
|
667 | 667 | |
|
668 | 668 | scmutil.writereporequirements(srcrepo, upgrade_op.new_requirements) |