dirstate-v2: Write .hg/dirstate back to disk on directory cache changes...
Simon Sapin
r48139:04d1f17f default
# context.py - changeset and file context objects for mercurial
#
# Copyright 2006, 2007 Olivia Mackall <olivia@selenic.com>
#
# This software may be used and distributed according to the terms of the
# GNU General Public License version 2 or any later version.

from __future__ import absolute_import

import errno
import filecmp
import os
import stat

from .i18n import _
from .node import (
    hex,
    nullrev,
    short,
)
from .pycompat import (
    getattr,
    open,
)
from . import (
    dagop,
    encoding,
    error,
    fileset,
    match as matchmod,
    mergestate as mergestatemod,
    metadata,
    obsolete as obsmod,
    patch,
    pathutil,
    phases,
    pycompat,
    repoview,
    scmutil,
    sparse,
    subrepo,
    subrepoutil,
    util,
)
from .utils import (
    dateutil,
    stringutil,
)

propertycache = util.propertycache

class basectx(object):
    """A basectx object represents the common logic for its children:
    changectx: read-only context that is already present in the repo,
    workingctx: a context that represents the working directory and can
                be committed,
    memctx: a context that represents changes in-memory and can also
            be committed."""

    def __init__(self, repo):
        self._repo = repo

    def __bytes__(self):
        return short(self.node())

    __str__ = encoding.strmethod(__bytes__)

    def __repr__(self):
        return "<%s %s>" % (type(self).__name__, str(self))

    def __eq__(self, other):
        try:
            return type(self) == type(other) and self._rev == other._rev
        except AttributeError:
            return False

    def __ne__(self, other):
        return not (self == other)

    def __contains__(self, key):
        return key in self._manifest

    def __getitem__(self, key):
        return self.filectx(key)

    def __iter__(self):
        return iter(self._manifest)

    def _buildstatusmanifest(self, status):
        """Builds a manifest that includes the given status results, if this is
        a working copy context. For non-working copy contexts, it just returns
        the normal manifest."""
        return self.manifest()

    def _matchstatus(self, other, match):
        """This internal method provides a way for child objects to override the
        match operator.
        """
        return match

    def _buildstatus(
        self, other, s, match, listignored, listclean, listunknown
    ):
        """build a status with respect to another context"""
        # Load earliest manifest first for caching reasons. More specifically,
        # if you have revisions 1000 and 1001, 1001 is probably stored as a
        # delta against 1000. Thus, if you read 1000 first, we'll reconstruct
        # 1000 and cache it so that when you read 1001, we just need to apply a
        # delta to what's in the cache. So that's one full reconstruction + one
        # delta application.
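        # For instance (hypothetical revision numbers): comparing a context at
        # rev 1001 against rev 1000 builds the rev-1000 manifest first, so the
        # cached reconstruction can serve as the delta base when the rev-1001
        # manifest is read next.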
        mf2 = None
        if self.rev() is not None and self.rev() < other.rev():
            mf2 = self._buildstatusmanifest(s)
        mf1 = other._buildstatusmanifest(s)
        if mf2 is None:
            mf2 = self._buildstatusmanifest(s)

        modified, added = [], []
        removed = []
        clean = []
        deleted, unknown, ignored = s.deleted, s.unknown, s.ignored
        deletedset = set(deleted)
        d = mf1.diff(mf2, match=match, clean=listclean)
        for fn, value in pycompat.iteritems(d):
            if fn in deletedset:
                continue
            if value is None:
                clean.append(fn)
                continue
            (node1, flag1), (node2, flag2) = value
            if node1 is None:
                added.append(fn)
            elif node2 is None:
                removed.append(fn)
            elif flag1 != flag2:
                modified.append(fn)
            elif node2 not in self._repo.nodeconstants.wdirfilenodeids:
                # When comparing files between two commits, we save time by
                # not comparing the file contents when the nodeids differ.
                # Note that this means we incorrectly report a reverted change
                # to a file as a modification.
                modified.append(fn)
            elif self[fn].cmp(other[fn]):
                modified.append(fn)
            else:
                clean.append(fn)

        if removed:
            # need to filter files if they are already reported as removed
            unknown = [
                fn
                for fn in unknown
                if fn not in mf1 and (not match or match(fn))
            ]
            ignored = [
                fn
                for fn in ignored
                if fn not in mf1 and (not match or match(fn))
            ]
            # if they're deleted, don't report them as removed
            removed = [fn for fn in removed if fn not in deletedset]

        return scmutil.status(
            modified, added, removed, deleted, unknown, ignored, clean
        )

    @propertycache
    def substate(self):
        return subrepoutil.state(self, self._repo.ui)

    def subrev(self, subpath):
        return self.substate[subpath][1]

    def rev(self):
        return self._rev

    def node(self):
        return self._node

    def hex(self):
        return hex(self.node())

    def manifest(self):
        return self._manifest

    def manifestctx(self):
        return self._manifestctx

    def repo(self):
        return self._repo

    def phasestr(self):
        return phases.phasenames[self.phase()]

    def mutable(self):
        return self.phase() > phases.public

    def matchfileset(self, cwd, expr, badfn=None):
        return fileset.match(self, cwd, expr, badfn=badfn)

    def obsolete(self):
        """True if the changeset is obsolete"""
        return self.rev() in obsmod.getrevs(self._repo, b'obsolete')

    def extinct(self):
        """True if the changeset is extinct"""
        return self.rev() in obsmod.getrevs(self._repo, b'extinct')

    def orphan(self):
        """True if the changeset is not obsolete, but its ancestor is"""
        return self.rev() in obsmod.getrevs(self._repo, b'orphan')

    def phasedivergent(self):
        """True if the changeset tries to be a successor of a public changeset

        Only non-public and non-obsolete changesets may be phase-divergent.
        """
        return self.rev() in obsmod.getrevs(self._repo, b'phasedivergent')

    def contentdivergent(self):
        """Is a successor of a changeset with multiple possible successor sets

        Only non-public and non-obsolete changesets may be content-divergent.
        """
        return self.rev() in obsmod.getrevs(self._repo, b'contentdivergent')

    def isunstable(self):
        """True if the changeset is either orphan, phase-divergent or
        content-divergent"""
        return self.orphan() or self.phasedivergent() or self.contentdivergent()

    def instabilities(self):
        """return the list of instabilities affecting this changeset.

        Instabilities are returned as strings. Possible values are:
        - orphan,
        - phase-divergent,
        - content-divergent.
        """
        instabilities = []
        if self.orphan():
            instabilities.append(b'orphan')
        if self.phasedivergent():
            instabilities.append(b'phase-divergent')
        if self.contentdivergent():
            instabilities.append(b'content-divergent')
        return instabilities

    def parents(self):
        """return contexts for each parent changeset"""
        return self._parents

    def p1(self):
        return self._parents[0]

    def p2(self):
        parents = self._parents
        if len(parents) == 2:
            return parents[1]
        return self._repo[nullrev]

    def _fileinfo(self, path):
        if '_manifest' in self.__dict__:
            try:
                return self._manifest.find(path)
            except KeyError:
                raise error.ManifestLookupError(
                    self._node or b'None', path, _(b'not found in manifest')
                )
        if '_manifestdelta' in self.__dict__ or path in self.files():
            if path in self._manifestdelta:
                return (
                    self._manifestdelta[path],
                    self._manifestdelta.flags(path),
                )
        mfl = self._repo.manifestlog
        try:
            node, flag = mfl[self._changeset.manifest].find(path)
        except KeyError:
            raise error.ManifestLookupError(
                self._node or b'None', path, _(b'not found in manifest')
            )

        return node, flag

    def filenode(self, path):
        return self._fileinfo(path)[0]

    def flags(self, path):
        try:
            return self._fileinfo(path)[1]
        except error.LookupError:
            return b''

    @propertycache
    def _copies(self):
        return metadata.computechangesetcopies(self)

    def p1copies(self):
        return self._copies[0]

    def p2copies(self):
        return self._copies[1]

    def sub(self, path, allowcreate=True):
        '''return a subrepo for the stored revision of path, never wdir()'''
        return subrepo.subrepo(self, path, allowcreate=allowcreate)

    def nullsub(self, path, pctx):
        return subrepo.nullsubrepo(self, path, pctx)

    def workingsub(self, path):
        """return a subrepo for the stored revision, or wdir if this is a wdir
        context.
        """
        return subrepo.subrepo(self, path, allowwdir=True)

    def match(
        self,
        pats=None,
        include=None,
        exclude=None,
        default=b'glob',
        listsubrepos=False,
        badfn=None,
        cwd=None,
    ):
        r = self._repo
        if not cwd:
            cwd = r.getcwd()
        return matchmod.match(
            r.root,
            cwd,
            pats,
            include,
            exclude,
            default,
            auditor=r.nofsauditor,
            ctx=self,
            listsubrepos=listsubrepos,
            badfn=badfn,
        )

    def diff(
        self,
        ctx2=None,
        match=None,
        changes=None,
        opts=None,
        losedatafn=None,
        pathfn=None,
        copy=None,
        copysourcematch=None,
        hunksfilterfn=None,
    ):
        """Returns a diff generator for the given contexts and matcher"""
        if ctx2 is None:
            ctx2 = self.p1()
        if ctx2 is not None:
            ctx2 = self._repo[ctx2]
        return patch.diff(
            self._repo,
            ctx2,
            self,
            match=match,
            changes=changes,
            opts=opts,
            losedatafn=losedatafn,
            pathfn=pathfn,
            copy=copy,
            copysourcematch=copysourcematch,
            hunksfilterfn=hunksfilterfn,
        )

    def dirs(self):
        return self._manifest.dirs()

    def hasdir(self, dir):
        return self._manifest.hasdir(dir)

    def status(
        self,
        other=None,
        match=None,
        listignored=False,
        listclean=False,
        listunknown=False,
        listsubrepos=False,
    ):
391 391 """return status of files between two nodes or node and working
392 392 directory.
393 393
394 394 If other is None, compare this node with working directory.
395 395
396 396 ctx1.status(ctx2) returns the status of change from ctx1 to ctx2
397 397
398 398 Returns a mercurial.scmutils.status object.
399 399
400 400 Data can be accessed using either tuple notation:
401 401
402 402 (modified, added, removed, deleted, unknown, ignored, clean)
403 403
404 404 or direct attribute access:
405 405
406 406 s.modified, s.added, ...
407 407 """

        ctx1 = self
        ctx2 = self._repo[other]

        # This next code block is, admittedly, fragile logic that tests for
        # reversing the contexts and wouldn't need to exist if it weren't for
        # the fast (and common) code path of comparing the working directory
        # with its first parent.
        #
        # What we're aiming for here is the ability to call:
        #
        # workingctx.status(parentctx)
        #
        # If we always built the manifest for each context and compared those,
        # then we'd be done. But the special case of the above call means we
        # just copy the manifest of the parent.
        reversed = False
        if not isinstance(ctx1, changectx) and isinstance(ctx2, changectx):
            reversed = True
            ctx1, ctx2 = ctx2, ctx1

        match = self._repo.narrowmatch(match)
        match = ctx2._matchstatus(ctx1, match)
        r = scmutil.status([], [], [], [], [], [], [])
        r = ctx2._buildstatus(
            ctx1, r, match, listignored, listclean, listunknown
        )

        if reversed:
            # Reverse added and removed. Clear deleted, unknown and ignored as
            # these make no sense to reverse.
            r = scmutil.status(
                r.modified, r.removed, r.added, [], [], [], r.clean
            )

        if listsubrepos:
            for subpath, sub in scmutil.itersubrepos(ctx1, ctx2):
                try:
                    rev2 = ctx2.subrev(subpath)
                except KeyError:
                    # A subrepo that existed in node1 was deleted between
                    # node1 and node2 (inclusive). Thus, ctx2's substate
                    # won't contain that subpath. The best we can do is
                    # ignore it.
                    rev2 = None
                submatch = matchmod.subdirmatcher(subpath, match)
                s = sub.status(
                    rev2,
                    match=submatch,
                    ignored=listignored,
                    clean=listclean,
                    unknown=listunknown,
                    listsubrepos=True,
                )
                for k in (
                    'modified',
                    'added',
                    'removed',
                    'deleted',
                    'unknown',
                    'ignored',
                    'clean',
                ):
                    rfiles, sfiles = getattr(r, k), getattr(s, k)
                    rfiles.extend(b"%s/%s" % (subpath, f) for f in sfiles)

        r.modified.sort()
        r.added.sort()
        r.removed.sort()
        r.deleted.sort()
        r.unknown.sort()
        r.ignored.sort()
        r.clean.sort()

        return r

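    # Usage sketch for status() above (hypothetical contexts ctx1 and ctx2):
    #   s = ctx1.status(ctx2)
    # describes the change from ctx1 to ctx2; every field of the returned
    # scmutil.status object (s.modified, s.added, ...) comes back sorted.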
    def mergestate(self, clean=False):
        """Get a mergestate object for this context."""
        raise NotImplementedError(
            '%s does not implement mergestate()' % self.__class__
        )

    def isempty(self):
        return not (
            len(self.parents()) > 1
            or self.branch() != self.p1().branch()
            or self.closesbranch()
            or self.files()
        )


class changectx(basectx):
    """A changecontext object makes access to data related to a particular
    changeset convenient. It represents a read-only context already present in
    the repo."""

    def __init__(self, repo, rev, node, maybe_filtered=True):
        super(changectx, self).__init__(repo)
        self._rev = rev
        self._node = node
        # When maybe_filtered is True, the revision might be affected by
        # changelog filtering, and operations must go through the filtered
        # changelog.
        #
        # When maybe_filtered is False, the revision has already been checked
        # against filtering and is not filtered. Operations through the
        # unfiltered changelog may be used in some cases.
        self._maybe_filtered = maybe_filtered

    def __hash__(self):
        try:
            return hash(self._rev)
        except AttributeError:
            return id(self)

    def __nonzero__(self):
        return self._rev != nullrev

    __bool__ = __nonzero__

    @propertycache
    def _changeset(self):
        if self._maybe_filtered:
            repo = self._repo
        else:
            repo = self._repo.unfiltered()
        return repo.changelog.changelogrevision(self.rev())

    @propertycache
    def _manifest(self):
        return self._manifestctx.read()

    @property
    def _manifestctx(self):
        return self._repo.manifestlog[self._changeset.manifest]

    @propertycache
    def _manifestdelta(self):
        return self._manifestctx.readdelta()

    @propertycache
    def _parents(self):
        repo = self._repo
        if self._maybe_filtered:
            cl = repo.changelog
        else:
            cl = repo.unfiltered().changelog

        p1, p2 = cl.parentrevs(self._rev)
        if p2 == nullrev:
            return [changectx(repo, p1, cl.node(p1), maybe_filtered=False)]
        return [
            changectx(repo, p1, cl.node(p1), maybe_filtered=False),
            changectx(repo, p2, cl.node(p2), maybe_filtered=False),
        ]

    def changeset(self):
        c = self._changeset
        return (
            c.manifest,
            c.user,
            c.date,
            c.files,
            c.description,
            c.extra,
        )

    def manifestnode(self):
        return self._changeset.manifest

    def user(self):
        return self._changeset.user

    def date(self):
        return self._changeset.date

    def files(self):
        return self._changeset.files

    def filesmodified(self):
        modified = set(self.files())
        modified.difference_update(self.filesadded())
        modified.difference_update(self.filesremoved())
        return sorted(modified)

    def filesadded(self):
        filesadded = self._changeset.filesadded
        compute_on_none = True
        if self._repo.filecopiesmode == b'changeset-sidedata':
            compute_on_none = False
        else:
            source = self._repo.ui.config(b'experimental', b'copies.read-from')
            if source == b'changeset-only':
                compute_on_none = False
            elif source != b'compatibility':
                # filelog mode, ignore any changelog content
                filesadded = None
        if filesadded is None:
            if compute_on_none:
                filesadded = metadata.computechangesetfilesadded(self)
            else:
                filesadded = []
        return filesadded

    def filesremoved(self):
        filesremoved = self._changeset.filesremoved
        compute_on_none = True
        if self._repo.filecopiesmode == b'changeset-sidedata':
            compute_on_none = False
        else:
            source = self._repo.ui.config(b'experimental', b'copies.read-from')
            if source == b'changeset-only':
                compute_on_none = False
            elif source != b'compatibility':
                # filelog mode, ignore any changelog content
                filesremoved = None
        if filesremoved is None:
            if compute_on_none:
                filesremoved = metadata.computechangesetfilesremoved(self)
            else:
                filesremoved = []
        return filesremoved

    @propertycache
    def _copies(self):
        p1copies = self._changeset.p1copies
        p2copies = self._changeset.p2copies
        compute_on_none = True
        if self._repo.filecopiesmode == b'changeset-sidedata':
            compute_on_none = False
        else:
            source = self._repo.ui.config(b'experimental', b'copies.read-from')
            # If config says to get copy metadata only from changeset, then
            # return that, defaulting to {} if there was no copy metadata. In
            # compatibility mode, we return copy data from the changeset if it
            # was recorded there, and otherwise we fall back to getting it from
            # the filelogs (below).
            #
            # If we are in compatibility mode and there is no data in the
            # changeset, we get the copy metadata from the filelogs.
            #
            # Otherwise, when config says to read only from the filelog, we get
            # the copy metadata from the filelogs.
            if source == b'changeset-only':
                compute_on_none = False
            elif source != b'compatibility':
                # filelog mode, ignore any changelog content
                p1copies = p2copies = None
        if p1copies is None:
            if compute_on_none:
                p1copies, p2copies = super(changectx, self)._copies
            else:
                if p1copies is None:
                    p1copies = {}
                if p2copies is None:
                    p2copies = {}
        return p1copies, p2copies

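    # Illustration for _copies above (hypothetical configuration): with
    #   [experimental]
    #   copies.read-from = compatibility
    # copy data recorded in the changeset wins, and the filelogs are only
    # consulted when the changeset recorded nothing.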
    def description(self):
        return self._changeset.description

    def branch(self):
        return encoding.tolocal(self._changeset.extra.get(b"branch"))

    def closesbranch(self):
        return b'close' in self._changeset.extra

    def extra(self):
        """Return a dict of extra information."""
        return self._changeset.extra

    def tags(self):
        """Return a list of byte tag names"""
        return self._repo.nodetags(self._node)

    def bookmarks(self):
        """Return a list of byte bookmark names."""
        return self._repo.nodebookmarks(self._node)

    def phase(self):
        return self._repo._phasecache.phase(self._repo, self._rev)

    def hidden(self):
        return self._rev in repoview.filterrevs(self._repo, b'visible')

    def isinmemory(self):
        return False

    def children(self):
        """return list of changectx contexts for each child changeset.

        This returns only the immediate child changesets. Use descendants() to
        recursively walk children.
        """
        c = self._repo.changelog.children(self._node)
        return [self._repo[x] for x in c]

    def ancestors(self):
        for a in self._repo.changelog.ancestors([self._rev]):
            yield self._repo[a]

    def descendants(self):
        """Recursively yield all children of the changeset.

        For just the immediate children, use children()
        """
        for d in self._repo.changelog.descendants([self._rev]):
            yield self._repo[d]

    def filectx(self, path, fileid=None, filelog=None):
        """get a file context from this changeset"""
        if fileid is None:
            fileid = self.filenode(path)
        return filectx(
            self._repo, path, fileid=fileid, changectx=self, filelog=filelog
        )

    def ancestor(self, c2, warn=False):
        """return the "best" ancestor context of self and c2

        If there are multiple candidates, it will show a message and check
        merge.preferancestor configuration before falling back to the
        revlog ancestor."""
        # deal with workingctxs
        n2 = c2._node
        if n2 is None:
            n2 = c2._parents[0]._node
        cahs = self._repo.changelog.commonancestorsheads(self._node, n2)
        if not cahs:
            anc = self._repo.nodeconstants.nullid
        elif len(cahs) == 1:
            anc = cahs[0]
        else:
            # experimental config: merge.preferancestor
            for r in self._repo.ui.configlist(b'merge', b'preferancestor'):
                try:
                    ctx = scmutil.revsymbol(self._repo, r)
                except error.RepoLookupError:
                    continue
                anc = ctx.node()
                if anc in cahs:
                    break
            else:
                anc = self._repo.changelog.ancestor(self._node, n2)
            if warn:
                self._repo.ui.status(
                    (
                        _(b"note: using %s as ancestor of %s and %s\n")
                        % (short(anc), short(self._node), short(n2))
                    )
                    + b''.join(
                        _(
                            b" alternatively, use --config "
                            b"merge.preferancestor=%s\n"
                        )
                        % short(n)
                        for n in sorted(cahs)
                        if n != anc
                    )
                )
        return self._repo[anc]

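    # For example, a merge run with
    #   --config merge.preferancestor=<rev>
    # makes ancestor() above prefer that candidate when several common
    # ancestor heads exist (a sketch of the experimental knob, not a
    # recommendation).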
    def isancestorof(self, other):
        """True if this changeset is an ancestor of other"""
        return self._repo.changelog.isancestorrev(self._rev, other._rev)

    def walk(self, match):
        '''Generates matching file names.'''

        # Wrap match.bad method to have message with nodeid
        def bad(fn, msg):
            # The manifest doesn't know about subrepos, so don't complain about
            # paths into valid subrepos.
            if any(fn == s or fn.startswith(s + b'/') for s in self.substate):
                return
            match.bad(fn, _(b'no such file in rev %s') % self)

        m = matchmod.badmatch(self._repo.narrowmatch(match), bad)
        return self._manifest.walk(m)

    def matches(self, match):
        return self.walk(match)


class basefilectx(object):
    """A filecontext object represents the common logic for its children:
    filectx: read-only access to a filerevision that is already present
             in the repo,
    workingfilectx: a filecontext that represents files from the working
                    directory,
    memfilectx: a filecontext that represents files in-memory,
    """

    @propertycache
    def _filelog(self):
        return self._repo.file(self._path)

    @propertycache
    def _changeid(self):
        if '_changectx' in self.__dict__:
            return self._changectx.rev()
        elif '_descendantrev' in self.__dict__:
            # this file context was created from a revision with a known
            # descendant, we can (lazily) correct for linkrev aliases
            return self._adjustlinkrev(self._descendantrev)
        else:
            return self._filelog.linkrev(self._filerev)

    @propertycache
    def _filenode(self):
        if '_fileid' in self.__dict__:
            return self._filelog.lookup(self._fileid)
        else:
            return self._changectx.filenode(self._path)

    @propertycache
    def _filerev(self):
        return self._filelog.rev(self._filenode)

    @propertycache
    def _repopath(self):
        return self._path

    def __nonzero__(self):
        try:
            self._filenode
            return True
        except error.LookupError:
            # file is missing
            return False

    __bool__ = __nonzero__

    def __bytes__(self):
        try:
            return b"%s@%s" % (self.path(), self._changectx)
        except error.LookupError:
            return b"%s@???" % self.path()

    __str__ = encoding.strmethod(__bytes__)

    def __repr__(self):
        return "<%s %s>" % (type(self).__name__, str(self))

    def __hash__(self):
        try:
            return hash((self._path, self._filenode))
        except AttributeError:
            return id(self)

    def __eq__(self, other):
        try:
            return (
                type(self) == type(other)
                and self._path == other._path
                and self._filenode == other._filenode
            )
        except AttributeError:
            return False

    def __ne__(self, other):
        return not (self == other)

    def filerev(self):
        return self._filerev

    def filenode(self):
        return self._filenode

    @propertycache
    def _flags(self):
        return self._changectx.flags(self._path)

    def flags(self):
        return self._flags

    def filelog(self):
        return self._filelog

    def rev(self):
        return self._changeid

    def linkrev(self):
        return self._filelog.linkrev(self._filerev)

    def node(self):
        return self._changectx.node()

    def hex(self):
        return self._changectx.hex()

    def user(self):
        return self._changectx.user()

    def date(self):
        return self._changectx.date()

    def files(self):
        return self._changectx.files()

    def description(self):
        return self._changectx.description()

    def branch(self):
        return self._changectx.branch()

    def extra(self):
        return self._changectx.extra()

    def phase(self):
        return self._changectx.phase()

    def phasestr(self):
        return self._changectx.phasestr()

    def obsolete(self):
        return self._changectx.obsolete()

    def instabilities(self):
        return self._changectx.instabilities()

    def manifest(self):
        return self._changectx.manifest()

    def changectx(self):
        return self._changectx

    def renamed(self):
        return self._copied

    def copysource(self):
        return self._copied and self._copied[0]

    def repo(self):
        return self._repo

    def size(self):
        return len(self.data())

    def path(self):
        return self._path

    def isbinary(self):
        try:
            return stringutil.binary(self.data())
        except IOError:
            return False

    def isexec(self):
        return b'x' in self.flags()

    def islink(self):
        return b'l' in self.flags()

    def isabsent(self):
        """whether this filectx represents a file not in self._changectx

        This is mainly for merge code to detect change/delete conflicts. This is
        expected to be True for all subclasses of basectx."""
        return False

    _customcmp = False

    def cmp(self, fctx):
        """compare with other file context

        returns True if different than fctx.
        """
        if fctx._customcmp:
            return fctx.cmp(self)

        if self._filenode is None:
            raise error.ProgrammingError(
                b'filectx.cmp() must be reimplemented if not backed by revlog'
            )

        if fctx._filenode is None:
            if self._repo._encodefilterpats:
                # can't rely on size() because wdir content may be decoded
                return self._filelog.cmp(self._filenode, fctx.data())
            if self.size() - 4 == fctx.size():
                # size() can match:
                # if file data starts with '\1\n', empty metadata block is
                # prepended, which adds 4 bytes to filelog.size().
                return self._filelog.cmp(self._filenode, fctx.data())
            if self.size() == fctx.size() or self.flags() == b'l':
                # size() matches: need to compare content
                # issue6456: Always compare symlinks because size can represent
                # encrypted string for EXT-4 encryption (fscrypt).
                return self._filelog.cmp(self._filenode, fctx.data())

        # size() differs
        return True

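    # The 4-byte allowance in cmp() above comes from the filelog metadata
    # escape: stored data that itself starts with b'\x01\n' gets an empty
    # metadata block b'\x01\n\x01\n' prepended, so a stored size of N + 4
    # can still mean identical content.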
    def _adjustlinkrev(self, srcrev, inclusive=False, stoprev=None):
        """return the first ancestor of <srcrev> introducing <fnode>

        If the linkrev of the file revision does not point to an ancestor of
        srcrev, we'll walk down the ancestors until we find one introducing
        this file revision.

        :srcrev: the changeset revision we search ancestors from
        :inclusive: if true, the src revision will also be checked
        :stoprev: an optional revision to stop the walk at. If no introduction
                  of this file content could be found before this floor
                  revision, the function will return "None" and stop its
                  iteration.
        """
        repo = self._repo
        cl = repo.unfiltered().changelog
        mfl = repo.manifestlog
        # fetch the linkrev
        lkr = self.linkrev()
        if srcrev == lkr:
            return lkr
        # hack to reuse ancestor computation when searching for renames
        memberanc = getattr(self, '_ancestrycontext', None)
        iteranc = None
        if srcrev is None:
            # wctx case, used by workingfilectx during mergecopy
            revs = [p.rev() for p in self._repo[None].parents()]
            inclusive = True  # we skipped the real (revless) source
        else:
            revs = [srcrev]
        if memberanc is None:
            memberanc = iteranc = cl.ancestors(revs, lkr, inclusive=inclusive)
        # check if this linkrev is an ancestor of srcrev
        if lkr not in memberanc:
            if iteranc is None:
                iteranc = cl.ancestors(revs, lkr, inclusive=inclusive)
            fnode = self._filenode
            path = self._path
            for a in iteranc:
                if stoprev is not None and a < stoprev:
                    return None
                ac = cl.read(a)  # get changeset data (we avoid object creation)
                if path in ac[3]:  # checking the 'files' field.
                    # The file has been touched, check if the content is
                    # similar to the one we search for.
                    if fnode == mfl[ac[0]].readfast().get(path):
                        return a
            # In theory, we should never get out of that loop without a result.
            # But if the manifest uses a buggy file revision (not a child of
            # the one it replaces), we could. Such a buggy situation will
            # likely result in a crash somewhere else at some point.
        return lkr

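    # Linkrev aliasing, sketched with hypothetical revisions: a file node
    # first introduced by rev 5 keeps linkrev 5 even when it is reached from
    # a rev 9 that does not descend from 5; the walk in _adjustlinkrev above
    # then finds the ancestor of 9 that really introduced the node.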
    def isintroducedafter(self, changelogrev):
        """True if a filectx has been introduced after a given floor revision"""
        if self.linkrev() >= changelogrev:
            return True
        introrev = self._introrev(stoprev=changelogrev)
        if introrev is None:
            return False
        return introrev >= changelogrev

    def introrev(self):
        """return the rev of the changeset which introduced this file revision

        This method is different from linkrev because it takes into account the
        changeset the filectx was created from. It ensures the returned
        revision is one of its ancestors. This prevents bugs from
        'linkrev-shadowing' when a file revision is used by multiple
        changesets.
        """
        return self._introrev()

    def _introrev(self, stoprev=None):
        """
        Same as `introrev`, but with an extra argument to limit the changelog
        iteration range in some internal use cases.

        If `stoprev` is set, the `introrev` will not be searched past that
        `stoprev` revision and "None" might be returned. This is useful to
        limit the iteration range.
        """
        toprev = None
        attrs = vars(self)
        if '_changeid' in attrs:
            # We have a cached value already
            toprev = self._changeid
        elif '_changectx' in attrs:
            # We know which changelog entry we are coming from
            toprev = self._changectx.rev()

        if toprev is not None:
            return self._adjustlinkrev(toprev, inclusive=True, stoprev=stoprev)
        elif '_descendantrev' in attrs:
            introrev = self._adjustlinkrev(self._descendantrev, stoprev=stoprev)
            # be nice and cache the result of the computation
            if introrev is not None:
                self._changeid = introrev
            return introrev
        else:
            return self.linkrev()

    def introfilectx(self):
        """Return filectx having identical contents, but pointing to the
        changeset revision where this filectx was introduced"""
        introrev = self.introrev()
        if self.rev() == introrev:
            return self
        return self.filectx(self.filenode(), changeid=introrev)

    def _parentfilectx(self, path, fileid, filelog):
        """create parent filectx keeping ancestry info for _adjustlinkrev()"""
        fctx = filectx(self._repo, path, fileid=fileid, filelog=filelog)
        if '_changeid' in vars(self) or '_changectx' in vars(self):
            # If self is associated with a changeset (probably explicitly
            # fed), ensure the created filectx is associated with a
            # changeset that is an ancestor of self.changectx.
            # This lets us later use _adjustlinkrev to get a correct link.
            fctx._descendantrev = self.rev()
            fctx._ancestrycontext = getattr(self, '_ancestrycontext', None)
        elif '_descendantrev' in vars(self):
            # Otherwise propagate _descendantrev if we have one associated.
            fctx._descendantrev = self._descendantrev
            fctx._ancestrycontext = getattr(self, '_ancestrycontext', None)
        return fctx

    def parents(self):
        _path = self._path
        fl = self._filelog
        parents = self._filelog.parents(self._filenode)
        pl = [
            (_path, node, fl)
            for node in parents
            if node != self._repo.nodeconstants.nullid
        ]

        r = fl.renamed(self._filenode)
        if r:
            # - In the simple rename case, both parents are nullid and pl is
            #   empty.
            # - In case of merge, only one of the parents is nullid and should
            #   be replaced with the rename information. This parent is
            #   -always- the first one.
            #
            # As nullid parents have always been filtered out in the list
            # comprehension above, inserting at index 0 always amounts to
            # "replacing the first nullid parent with the rename information".
            pl.insert(0, (r[0], r[1], self._repo.file(r[0])))

        return [self._parentfilectx(path, fnode, l) for path, fnode, l in pl]

    def p1(self):
        return self.parents()[0]

    def p2(self):
        p = self.parents()
        if len(p) == 2:
            return p[1]
        return filectx(self._repo, self._path, fileid=-1, filelog=self._filelog)

    def annotate(self, follow=False, skiprevs=None, diffopts=None):
        """Returns a list of annotateline objects for each line in the file

        - line.fctx is the filectx of the node where that line was last changed
        - line.lineno is the line number at the first appearance in the managed
          file
        - line.text is the data on that line (including newline character)
        """
        getlog = util.lrucachefunc(lambda x: self._repo.file(x))

        def parents(f):
            # Cut _descendantrev here to mitigate the penalty of lazy linkrev
            # adjustment. Otherwise, p._adjustlinkrev() would walk changelog
            # from the topmost introrev (= srcrev) down to p.linkrev() if it
            # isn't an ancestor of the srcrev.
            f._changeid
            pl = f.parents()

            # Don't return renamed parents if we aren't following.
            if not follow:
                pl = [p for p in pl if p.path() == f.path()]

            # renamed filectx won't have a filelog yet, so set it
            # from the cache to save time
            for p in pl:
                if not '_filelog' in p.__dict__:
                    p._filelog = getlog(p.path())

            return pl

        # use linkrev to find the first changeset where self appeared
        base = self.introfilectx()
        if getattr(base, '_ancestrycontext', None) is None:
            # it is safe to use an unfiltered repository here because we are
            # walking ancestors only.
            cl = self._repo.unfiltered().changelog
            if base.rev() is None:
                # wctx is not inclusive, but works because _ancestrycontext
                # is used to test filelog revisions
                ac = cl.ancestors(
                    [p.rev() for p in base.parents()], inclusive=True
                )
            else:
                ac = cl.ancestors([base.rev()], inclusive=True)
            base._ancestrycontext = ac

        return dagop.annotate(
            base, parents, skiprevs=skiprevs, diffopts=diffopts
        )

    def ancestors(self, followfirst=False):
        visit = {}
        c = self
        if followfirst:
            cut = 1
        else:
            cut = None

        while True:
            for parent in c.parents()[:cut]:
                visit[(parent.linkrev(), parent.filenode())] = parent
            if not visit:
                break
            c = visit.pop(max(visit))
            yield c

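    # In ancestors() above, visit is keyed by (linkrev, filenode), so popping
    # max(visit) always yields the pending ancestor with the highest linkrev,
    # i.e. ancestors are generated newest-first.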
    def decodeddata(self):
        """Returns `data()` after running repository decoding filters.

        This is often equivalent to how the data would be expressed on disk.
        """
        return self._repo.wwritedata(self.path(), self.data())


class filectx(basefilectx):
    """A filecontext object makes access to data related to a particular
    filerevision convenient."""

    def __init__(
        self,
        repo,
        path,
        changeid=None,
        fileid=None,
        filelog=None,
        changectx=None,
    ):
        """changeid must be a revision number, if specified.
        fileid can be a file revision or node."""
        self._repo = repo
        self._path = path

        assert (
            changeid is not None or fileid is not None or changectx is not None
        ), b"bad args: changeid=%r, fileid=%r, changectx=%r" % (
            changeid,
            fileid,
            changectx,
        )

        if filelog is not None:
            self._filelog = filelog

        if changeid is not None:
            self._changeid = changeid
        if changectx is not None:
            self._changectx = changectx
        if fileid is not None:
            self._fileid = fileid

    @propertycache
    def _changectx(self):
        try:
            return self._repo[self._changeid]
        except error.FilteredRepoLookupError:
            # Linkrev may point to any revision in the repository. When the
            # repository is filtered this may lead to `filectx` trying to
            # build `changectx` for a filtered revision. In such a case we
            # fall back to creating a `changectx` on the unfiltered version
            # of the repository. This fallback should not be an issue because
            # `changectx` from `filectx` are not used in complex operations
            # that care about filtering.
            #
            # This fallback is a cheap and dirty fix that prevents several
            # crashes. It does not ensure the behavior is correct. However the
            # behavior was not correct before filtering either, and "incorrect
            # behavior" is considered better than "crash".
            #
            # Linkrevs have several serious troubles with filtering that are
            # complicated to solve. Proper handling of the issue here should be
            # considered when solutions to the linkrev issue are on the table.
            return self._repo.unfiltered()[self._changeid]

    def filectx(self, fileid, changeid=None):
        """opens an arbitrary revision of the file without
        opening a new filelog"""
        return filectx(
            self._repo,
            self._path,
            fileid=fileid,
            filelog=self._filelog,
            changeid=changeid,
        )

    def rawdata(self):
        return self._filelog.rawdata(self._filenode)

    def rawflags(self):
        """low-level revlog flags"""
        return self._filelog.flags(self._filerev)

    def data(self):
        try:
            return self._filelog.read(self._filenode)
        except error.CensoredNodeError:
            if self._repo.ui.config(b"censor", b"policy") == b"ignore":
                return b""
            raise error.Abort(
                _(b"censored node: %s") % short(self._filenode),
                hint=_(b"set censor.policy to ignore errors"),
            )

    def size(self):
        return self._filelog.size(self._filerev)

    @propertycache
    def _copied(self):
        """check if file was actually renamed in this changeset revision

        If a rename is logged in the file revision, we report the copy for the
        changeset only if the file revision's linkrev points back to the
        changeset in question or if both changeset parents contain different
        file revisions.
        """

        renamed = self._filelog.renamed(self._filenode)
        if not renamed:
            return None

        if self.rev() == self.linkrev():
            return renamed

        name = self.path()
        fnode = self._filenode
        for p in self._changectx.parents():
            try:
                if fnode == p.filenode(name):
                    return None
            except error.LookupError:
                pass
        return renamed

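    # Hypothetical example: after `hg cp a b` and a commit, b's new file
    # revision records a as its rename source; the checks in _copied above
    # keep later changesets that merely reuse that same file revision from
    # re-reporting the copy.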
    def children(self):
        # hard for renames
        c = self._filelog.children(self._filenode)
        return [
            filectx(self._repo, self._path, fileid=x, filelog=self._filelog)
            for x in c
        ]


class committablectx(basectx):
    """A committablectx object provides common functionality for a context that
    wants the ability to commit, e.g. workingctx or memctx."""

    def __init__(
        self,
        repo,
        text=b"",
        user=None,
        date=None,
        extra=None,
        changes=None,
        branch=None,
    ):
        super(committablectx, self).__init__(repo)
        self._rev = None
        self._node = None
        self._text = text
        if date:
            self._date = dateutil.parsedate(date)
        if user:
            self._user = user
        if changes:
            self._status = changes

        self._extra = {}
        if extra:
            self._extra = extra.copy()
        if branch is not None:
            self._extra[b'branch'] = encoding.fromlocal(branch)
        if not self._extra.get(b'branch'):
            self._extra[b'branch'] = b'default'

    def __bytes__(self):
        return bytes(self._parents[0]) + b"+"

    def hex(self):
        return self._repo.nodeconstants.wdirhex

    __str__ = encoding.strmethod(__bytes__)

    def __nonzero__(self):
        return True

    __bool__ = __nonzero__

    @propertycache
    def _status(self):
        return self._repo.status()

    @propertycache
    def _user(self):
        return self._repo.ui.username()

    @propertycache
    def _date(self):
        ui = self._repo.ui
        date = ui.configdate(b'devel', b'default-date')
        if date is None:
            date = dateutil.makedate()
        return date

    def subrev(self, subpath):
        return None

    def manifestnode(self):
        return None

    def user(self):
        return self._user or self._repo.ui.username()

    def date(self):
        return self._date

    def description(self):
        return self._text

    def files(self):
        return sorted(
            self._status.modified + self._status.added + self._status.removed
        )

    def modified(self):
        return self._status.modified

    def added(self):
        return self._status.added

    def removed(self):
        return self._status.removed

    def deleted(self):
        return self._status.deleted

    filesmodified = modified
    filesadded = added
    filesremoved = removed

    def branch(self):
        return encoding.tolocal(self._extra[b'branch'])

    def closesbranch(self):
        return b'close' in self._extra

    def extra(self):
        return self._extra

    def isinmemory(self):
        return False

    def tags(self):
        return []

    def bookmarks(self):
        b = []
        for p in self.parents():
            b.extend(p.bookmarks())
        return b

    def phase(self):
        phase = phases.newcommitphase(self._repo.ui)
        for p in self.parents():
            phase = max(phase, p.phase())
        return phase

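    # e.g. with the default phases.new-commit=draft, a pending commit on top
    # of a secret parent still comes out secret: the maximum of the configured
    # new-commit phase and all parent phases wins.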
    def hidden(self):
        return False

    def children(self):
        return []

    def flags(self, path):
        if '_manifest' in self.__dict__:
            try:
                return self._manifest.flags(path)
            except KeyError:
                return b''

        try:
            return self._flagfunc(path)
        except OSError:
            return b''

    def ancestor(self, c2):
        """return the "best" ancestor context of self and c2"""
        return self._parents[0].ancestor(c2)  # punt on two parents for now

    def ancestors(self):
        for p in self._parents:
            yield p
        for a in self._repo.changelog.ancestors(
            [p.rev() for p in self._parents]
        ):
            yield self._repo[a]

    def markcommitted(self, node):
        """Perform post-commit cleanup necessary after committing this ctx

        Specifically, this updates backing stores this working context
        wraps to reflect the fact that the changes reflected by this
        workingctx have been committed. For example, it marks
        modified and added files as normal in the dirstate.

        """

    def dirty(self, missing=False, merge=True, branch=True):
        return False


class workingctx(committablectx):
    """A workingctx object makes access to data related to
    the current working directory convenient.
    date - any valid date string or (unixtime, offset), or None.
    user - username string, or None.
    extra - a dictionary of extra values, or None.
    changes - a list of file lists as returned by localrepo.status()
              or None to use the repository status.
    """

    def __init__(
        self, repo, text=b"", user=None, date=None, extra=None, changes=None
    ):
        branch = None
        if not extra or b'branch' not in extra:
            try:
                branch = repo.dirstate.branch()
            except UnicodeDecodeError:
                raise error.Abort(_(b'branch name not in UTF-8!'))
        super(workingctx, self).__init__(
            repo, text, user, date, extra, changes, branch=branch
        )

    def __iter__(self):
        d = self._repo.dirstate
        for f in d:
            if d[f] != b'r':
                yield f

    def __contains__(self, key):
        return self._repo.dirstate[key] not in b"?r"

    def hex(self):
        return self._repo.nodeconstants.wdirhex

    @propertycache
    def _parents(self):
        p = self._repo.dirstate.parents()
        if p[1] == self._repo.nodeconstants.nullid:
            p = p[:-1]
        # use unfiltered repo to delay/avoid loading obsmarkers
        unfi = self._repo.unfiltered()
        return [
            changectx(
                self._repo, unfi.changelog.rev(n), n, maybe_filtered=False
            )
            for n in p
        ]

    def setparents(self, p1node, p2node=None):
        if p2node is None:
            p2node = self._repo.nodeconstants.nullid
        dirstate = self._repo.dirstate
        with dirstate.parentchange():
            copies = dirstate.setparents(p1node, p2node)
            pctx = self._repo[p1node]
            if copies:
                # Adjust copy records, the dirstate cannot do it, it
                # requires access to parents manifests. Preserve them
                # only for entries added to first parent.
                for f in copies:
                    if f not in pctx and copies[f] in pctx:
                        dirstate.copy(copies[f], f)
            if p2node == self._repo.nodeconstants.nullid:
                for f, s in sorted(dirstate.copies().items()):
                    if f not in pctx and s not in pctx:
                        dirstate.copy(None, f)

    def _fileinfo(self, path):
        # populate __dict__['_manifest'] as workingctx has no _manifestdelta
        self._manifest
        return super(workingctx, self)._fileinfo(path)

    def _buildflagfunc(self):
        # Create a fallback function for getting file flags when the
        # filesystem doesn't support them

        copiesget = self._repo.dirstate.copies().get
        parents = self.parents()
        if len(parents) < 2:
            # when we have one parent, it's easy: copy from parent
            man = parents[0].manifest()

            def func(f):
                f = copiesget(f, f)
                return man.flags(f)

        else:
            # merges are tricky: we try to reconstruct the unstored
            # result from the merge (issue1802)
            p1, p2 = parents
            pa = p1.ancestor(p2)
            m1, m2, ma = p1.manifest(), p2.manifest(), pa.manifest()

            def func(f):
                f = copiesget(f, f)  # may be wrong for merges with copies
                fl1, fl2, fla = m1.flags(f), m2.flags(f), ma.flags(f)
                if fl1 == fl2:
                    return fl1
                if fl1 == fla:
                    return fl2
                if fl2 == fla:
                    return fl1
                return b''  # punt for conflicts

        return func

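    # The flag-merge resolution above, spelled out: identical flags on both
    # sides win outright; if one side still matches the ancestor, the other
    # side is the one that changed the flag and wins; if both sides changed
    # it differently, the conflict is punted as b''.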
    @propertycache
    def _flagfunc(self):
        return self._repo.dirstate.flagfunc(self._buildflagfunc)

    def flags(self, path):
        try:
            return self._flagfunc(path)
        except OSError:
            return b''

    def filectx(self, path, filelog=None):
        """get a file context from the working directory"""
        return workingfilectx(
            self._repo, path, workingctx=self, filelog=filelog
        )

    def dirty(self, missing=False, merge=True, branch=True):
        """check whether a working directory is modified"""
        # check subrepos first
        for s in sorted(self.substate):
            if self.sub(s).dirty(missing=missing):
                return True
        # check current working dir
        return (
            (merge and self.p2())
            or (branch and self.branch() != self.p1().branch())
            or self.modified()
            or self.added()
            or self.removed()
            or (missing and self.deleted())
        )

    def add(self, list, prefix=b""):
        with self._repo.wlock():
            ui, ds = self._repo.ui, self._repo.dirstate
            uipath = lambda f: ds.pathto(pathutil.join(prefix, f))
            rejected = []
            lstat = self._repo.wvfs.lstat
            for f in list:
                # ds.pathto() returns an absolute file when this is invoked from
                # the keyword extension. That gets flagged as non-portable on
                # Windows, since it contains the drive letter and colon.
                scmutil.checkportable(ui, os.path.join(prefix, f))
                try:
                    st = lstat(f)
                except OSError:
                    ui.warn(_(b"%s does not exist!\n") % uipath(f))
                    rejected.append(f)
                    continue
                limit = ui.configbytes(b'ui', b'large-file-limit')
                if limit != 0 and st.st_size > limit:
                    ui.warn(
                        _(
                            b"%s: up to %d MB of RAM may be required "
                            b"to manage this file\n"
                            b"(use 'hg revert %s' to cancel the "
                            b"pending addition)\n"
                        )
                        % (f, 3 * st.st_size // 1000000, uipath(f))
                    )
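                    # The figure shown is 3 * st.st_size // 1000000, i.e.
                    # roughly three times the file size in decimal megabytes
                    # (a rough built-in heuristic, not a measurement).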
                if not (stat.S_ISREG(st.st_mode) or stat.S_ISLNK(st.st_mode)):
                    ui.warn(
                        _(
                            b"%s not added: only files and symlinks "
                            b"supported currently\n"
                        )
                        % uipath(f)
                    )
                    rejected.append(f)
                elif ds[f] in b'amn':
                    ui.warn(_(b"%s already tracked!\n") % uipath(f))
                elif ds[f] == b'r':
                    ds.normallookup(f)
                else:
                    ds.add(f)
            return rejected

1712 1712 def forget(self, files, prefix=b""):
1713 1713 with self._repo.wlock():
1714 1714 ds = self._repo.dirstate
1715 1715 uipath = lambda f: ds.pathto(pathutil.join(prefix, f))
1716 1716 rejected = []
1717 1717 for f in files:
1718 1718 if f not in ds:
1719 1719 self._repo.ui.warn(_(b"%s not tracked!\n") % uipath(f))
1720 1720 rejected.append(f)
1721 1721 elif ds[f] != b'a':
1722 1722 ds.remove(f)
1723 1723 else:
1724 1724 ds.drop(f)
1725 1725 return rejected
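
# Round-trip sketch (illustrative):
#
#   wctx.add([b'newfile'])     # dirstate entry becomes 'a'
#   wctx.forget([b'newfile'])  # 'a' entries are dropped outright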
1726 1726
1727 1727 def copy(self, source, dest):
1728 1728 try:
1729 1729 st = self._repo.wvfs.lstat(dest)
1730 1730 except OSError as err:
1731 1731 if err.errno != errno.ENOENT:
1732 1732 raise
1733 1733 self._repo.ui.warn(
1734 1734 _(b"%s does not exist!\n") % self._repo.dirstate.pathto(dest)
1735 1735 )
1736 1736 return
1737 1737 if not (stat.S_ISREG(st.st_mode) or stat.S_ISLNK(st.st_mode)):
1738 1738 self._repo.ui.warn(
1739 1739 _(b"copy failed: %s is not a file or a symbolic link\n")
1740 1740 % self._repo.dirstate.pathto(dest)
1741 1741 )
1742 1742 else:
1743 1743 with self._repo.wlock():
1744 1744 ds = self._repo.dirstate
1745 1745 if ds[dest] in b'?':
1746 1746 ds.add(dest)
1747 1747 elif ds[dest] in b'r':
1748 1748 ds.normallookup(dest)
1749 1749 ds.copy(source, dest)
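
# e.g. (illustrative) what ``hg copy src dst`` does after duplicating the
# file on disk:
#
#   wctx.copy(b'src.txt', b'dst.txt')  # record dst as a copy of src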
1750 1750
1751 1751 def match(
1752 1752 self,
1753 1753 pats=None,
1754 1754 include=None,
1755 1755 exclude=None,
1756 1756 default=b'glob',
1757 1757 listsubrepos=False,
1758 1758 badfn=None,
1759 1759 cwd=None,
1760 1760 ):
1761 1761 r = self._repo
1762 1762 if not cwd:
1763 1763 cwd = r.getcwd()
1764 1764
1765 1765 # Only a case-insensitive filesystem needs magic to translate user input
1766 1766 # to actual case in the filesystem.
1767 1767 icasefs = not util.fscasesensitive(r.root)
1768 1768 return matchmod.match(
1769 1769 r.root,
1770 1770 cwd,
1771 1771 pats,
1772 1772 include,
1773 1773 exclude,
1774 1774 default,
1775 1775 auditor=r.auditor,
1776 1776 ctx=self,
1777 1777 listsubrepos=listsubrepos,
1778 1778 badfn=badfn,
1779 1779 icasefs=icasefs,
1780 1780 )
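
# e.g. (illustrative) building a matcher for Python files and walking the
# tracked and unknown files it selects:
#
#   m = wctx.match([b'glob:**.py'])
#   for f in wctx.walk(m):
#       ...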
1781 1781
1782 1782 def _filtersuspectsymlink(self, files):
1783 1783 if not files or self._repo.dirstate._checklink:
1784 1784 return files
1785 1785
1786 1786 # Symlink placeholders may get non-symlink-like contents
1787 1787 # via user error or dereferencing by NFS or Samba servers,
1788 1788 # so we filter out any placeholders that don't look like a
1789 1789 # symlink
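# (on checkouts without symlink support, a symlink is materialized as a
# small regular file containing just the link target path)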
1790 1790 sane = []
1791 1791 for f in files:
1792 1792 if self.flags(f) == b'l':
1793 1793 d = self[f].data()
1794 1794 if (
1795 1795 d == b''
1796 1796 or len(d) >= 1024
1797 1797 or b'\n' in d
1798 1798 or stringutil.binary(d)
1799 1799 ):
1800 1800 self._repo.ui.debug(
1801 1801 b'ignoring suspect symlink placeholder "%s"\n' % f
1802 1802 )
1803 1803 continue
1804 1804 sane.append(f)
1805 1805 return sane
1806 1806
1807 1807 def _checklookup(self, files):
1808 1808 # check for any possibly clean files
1809 1809 if not files:
1810 1810 return [], [], []
1811 1811
1812 1812 modified = []
1813 1813 deleted = []
1814 1814 fixup = []
1815 1815 pctx = self._parents[0]
1816 1816 # do a full compare of any files that might have changed
1817 1817 for f in sorted(files):
1818 1818 try:
1819 1819 # This will return True for a file that got replaced by a
1820 1820 # directory in the interim, but fixing that is pretty hard.
1821 1821 if (
1822 1822 f not in pctx
1823 1823 or self.flags(f) != pctx.flags(f)
1824 1824 or pctx[f].cmp(self[f])
1825 1825 ):
1826 1826 modified.append(f)
1827 1827 else:
1828 1828 fixup.append(f)
1829 1829 except (IOError, OSError):
1830 1830 # A file became inaccessible in between? Mark it as deleted,
1831 1831 # matching dirstate behavior (issue5584).
1832 1832 # The dirstate has more complex behavior around whether a
1833 1833 # missing file matches a directory, etc, but we don't need to
1834 1834 # bother with that: if f has made it to this point, we're sure
1835 1835 # it's in the dirstate.
1836 1836 deleted.append(f)
1837 1837
1838 1838 return modified, deleted, fixup
1839 1839
1840 1840 def _poststatusfixup(self, status, fixup):
1841 1841 """update dirstate for files that are actually clean"""
1842 1842 poststatus = self._repo.postdsstatus()
1843 if fixup or poststatus:
1843 if fixup or poststatus or self._repo.dirstate._dirty:
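# (the dirstate can be dirty even when there is nothing to fix up,
# e.g. when reading it updated internal caches; taking this branch
# lets those changes be written back to disk below)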
1844 1844 try:
1845 1845 oldid = self._repo.dirstate.identity()
1846 1846
1847 1847 # updating the dirstate is optional
1848 1848 # so we don't wait on the lock
1849 1849 # wlock can invalidate the dirstate, so cache normal _after_
1850 1850 # taking the lock
1851 1851 with self._repo.wlock(False):
1852 1852 if self._repo.dirstate.identity() == oldid:
1853 1853 if fixup:
1854 1854 normal = self._repo.dirstate.normal
1855 1855 for f in fixup:
1856 1856 normal(f)
1857 1857 # write changes out explicitly, because nesting
1858 1858 # wlock at runtime may prevent 'wlock.release()'
1859 1859 # after this block from doing so for subsequent
1860 1860 # changing files
1861 1861 tr = self._repo.currenttransaction()
1862 1862 self._repo.dirstate.write(tr)
1863 1863
1864 1864 if poststatus:
1865 1865 for ps in poststatus:
1866 1866 ps(self, status)
1867 1867 else:
1868 1868 # in this case, writing changes out breaks
1869 1869 # consistency, because .hg/dirstate was
1870 1870 # already changed simultaneously after last
1871 1871 # caching (see also issue5584 for detail)
1872 1872 self._repo.ui.debug(
1873 1873 b'skip updating dirstate: identity mismatch\n'
1874 1874 )
1875 1875 except error.LockError:
1876 1876 pass
1877 1877 finally:
1878 1878 # Even if the wlock couldn't be grabbed, clear out the list.
1879 1879 self._repo.clearpostdsstatus()
1880 1880
1881 1881 def _dirstatestatus(self, match, ignored=False, clean=False, unknown=False):
1882 1882 '''Gets the status from the dirstate -- internal use only.'''
1883 1883 subrepos = []
1884 1884 if b'.hgsub' in self:
1885 1885 subrepos = sorted(self.substate)
1886 1886 cmp, s = self._repo.dirstate.status(
1887 1887 match, subrepos, ignored=ignored, clean=clean, unknown=unknown
1888 1888 )
1889 1889
1890 1890 # check for any possibly clean files
1891 1891 fixup = []
1892 1892 if cmp:
1893 1893 modified2, deleted2, fixup = self._checklookup(cmp)
1894 1894 s.modified.extend(modified2)
1895 1895 s.deleted.extend(deleted2)
1896 1896
1897 1897 if fixup and clean:
1898 1898 s.clean.extend(fixup)
1899 1899
1900 1900 self._poststatusfixup(s, fixup)
1901 1901
1902 1902 if match.always():
1903 1903 # cache for performance
1904 1904 if s.unknown or s.ignored or s.clean:
1905 1905 # "_status" is cached with list*=False in the normal route
1906 1906 self._status = scmutil.status(
1907 1907 s.modified, s.added, s.removed, s.deleted, [], [], []
1908 1908 )
1909 1909 else:
1910 1910 self._status = s
1911 1911
1912 1912 return s
1913 1913
1914 1914 @propertycache
1915 1915 def _copies(self):
1916 1916 p1copies = {}
1917 1917 p2copies = {}
1918 1918 parents = self._repo.dirstate.parents()
1919 1919 p1manifest = self._repo[parents[0]].manifest()
1920 1920 p2manifest = self._repo[parents[1]].manifest()
1921 1921 changedset = set(self.added()) | set(self.modified())
1922 1922 narrowmatch = self._repo.narrowmatch()
1923 1923 for dst, src in self._repo.dirstate.copies().items():
1924 1924 if dst not in changedset or not narrowmatch(dst):
1925 1925 continue
1926 1926 if src in p1manifest:
1927 1927 p1copies[dst] = src
1928 1928 elif src in p2manifest:
1929 1929 p2copies[dst] = src
1930 1930 return p1copies, p2copies
1931 1931
1932 1932 @propertycache
1933 1933 def _manifest(self):
1934 1934 """generate a manifest corresponding to the values in self._status
1935 1935
1936 1936 This reuses the file nodeids from the parent, but uses special node
1937 1937 identifiers for added and modified files. This is used by manifest
1938 1938 merge to see that files are different and by update logic to avoid
1939 1939 deleting newly added files.
1940 1940 """
1941 1941 return self._buildstatusmanifest(self._status)
1942 1942
1943 1943 def _buildstatusmanifest(self, status):
1944 1944 """Builds a manifest that includes the given status results."""
1945 1945 parents = self.parents()
1946 1946
1947 1947 man = parents[0].manifest().copy()
1948 1948
1949 1949 ff = self._flagfunc
1950 1950 for i, l in (
1951 1951 (self._repo.nodeconstants.addednodeid, status.added),
1952 1952 (self._repo.nodeconstants.modifiednodeid, status.modified),
1953 1953 ):
1954 1954 for f in l:
1955 1955 man[f] = i
1956 1956 try:
1957 1957 man.setflag(f, ff(f))
1958 1958 except OSError:
1959 1959 pass
1960 1960
1961 1961 for f in status.deleted + status.removed:
1962 1962 if f in man:
1963 1963 del man[f]
1964 1964
1965 1965 return man
1966 1966
1967 1967 def _buildstatus(
1968 1968 self, other, s, match, listignored, listclean, listunknown
1969 1969 ):
1970 1970 """build a status with respect to another context
1971 1971
1972 1972 This includes logic for maintaining the fast path of status when
1973 1973 comparing the working directory against its parent, which is to skip
1974 1974 building a new manifest if self (working directory) is not comparing
1975 1975 against its parent (repo['.']).
1976 1976 """
1977 1977 s = self._dirstatestatus(match, listignored, listclean, listunknown)
1978 1978 # Filter out symlinks that, in the case of FAT32 and NTFS filesystems,
1979 1979 # might have accidentally ended up with the entire contents of the file
1980 1980 # they are supposed to be linking to.
1981 1981 s.modified[:] = self._filtersuspectsymlink(s.modified)
1982 1982 if other != self._repo[b'.']:
1983 1983 s = super(workingctx, self)._buildstatus(
1984 1984 other, s, match, listignored, listclean, listunknown
1985 1985 )
1986 1986 return s
1987 1987
1988 1988 def _matchstatus(self, other, match):
1989 1989 """override the match method with a filter for directory patterns
1990 1990
1991 1991 We use inheritance to customize the match.bad method only in cases of
1992 1992 workingctx since it belongs only to the working directory when
1993 1993 comparing against the parent changeset.
1994 1994
1995 1995 If we aren't comparing against the working directory's parent, then we
1996 1996 just use the default match object sent to us.
1997 1997 """
1998 1998 if other != self._repo[b'.']:
1999 1999
2000 2000 def bad(f, msg):
2001 2001 # 'f' may be a directory pattern from 'match.files()',
2002 2002 # so 'f not in ctx1' is not enough
2003 2003 if f not in other and not other.hasdir(f):
2004 2004 self._repo.ui.warn(
2005 2005 b'%s: %s\n' % (self._repo.dirstate.pathto(f), msg)
2006 2006 )
2007 2007
2008 2008 match.bad = bad
2009 2009 return match
2010 2010
2011 2011 def walk(self, match):
2012 2012 '''Generates matching file names.'''
2013 2013 return sorted(
2014 2014 self._repo.dirstate.walk(
2015 2015 self._repo.narrowmatch(match),
2016 2016 subrepos=sorted(self.substate),
2017 2017 unknown=True,
2018 2018 ignored=False,
2019 2019 )
2020 2020 )
2021 2021
2022 2022 def matches(self, match):
2023 2023 match = self._repo.narrowmatch(match)
2024 2024 ds = self._repo.dirstate
2025 2025 return sorted(f for f in ds.matches(match) if ds[f] != b'r')
2026 2026
2027 2027 def markcommitted(self, node):
2028 2028 with self._repo.dirstate.parentchange():
2029 2029 for f in self.modified() + self.added():
2030 2030 self._repo.dirstate.normal(f)
2031 2031 for f in self.removed():
2032 2032 self._repo.dirstate.drop(f)
2033 2033 self._repo.dirstate.setparents(node)
2034 2034 self._repo._quick_access_changeid_invalidate()
2035 2035
2036 2036 # write changes out explicitly, because nesting wlock at
2037 2037 # runtime may prevent 'wlock.release()' in 'repo.commit()'
2038 2038 # from immediately doing so for subsequent changing files
2039 2039 self._repo.dirstate.write(self._repo.currenttransaction())
2040 2040
2041 2041 sparse.aftercommit(self._repo, node)
2042 2042
2043 2043 def mergestate(self, clean=False):
2044 2044 if clean:
2045 2045 return mergestatemod.mergestate.clean(self._repo)
2046 2046 return mergestatemod.mergestate.read(self._repo)
2047 2047
2048 2048
2049 2049 class committablefilectx(basefilectx):
2050 2050 """A committablefilectx provides common functionality for a file context
2051 2051 that wants the ability to commit, e.g. workingfilectx or memfilectx."""
2052 2052
2053 2053 def __init__(self, repo, path, filelog=None, ctx=None):
2054 2054 self._repo = repo
2055 2055 self._path = path
2056 2056 self._changeid = None
2057 2057 self._filerev = self._filenode = None
2058 2058
2059 2059 if filelog is not None:
2060 2060 self._filelog = filelog
2061 2061 if ctx:
2062 2062 self._changectx = ctx
2063 2063
2064 2064 def __nonzero__(self):
2065 2065 return True
2066 2066
2067 2067 __bool__ = __nonzero__
2068 2068
2069 2069 def linkrev(self):
2070 2070 # linked to self._changectx no matter if file is modified or not
2071 2071 return self.rev()
2072 2072
2073 2073 def renamed(self):
2074 2074 path = self.copysource()
2075 2075 if not path:
2076 2076 return None
2077 2077 return (
2078 2078 path,
2079 2079 self._changectx._parents[0]._manifest.get(
2080 2080 path, self._repo.nodeconstants.nullid
2081 2081 ),
2082 2082 )
2083 2083
2084 2084 def parents(self):
2085 2085 '''return parent filectxs, following copies if necessary'''
2086 2086
2087 2087 def filenode(ctx, path):
2088 2088 return ctx._manifest.get(path, self._repo.nodeconstants.nullid)
2089 2089
2090 2090 path = self._path
2091 2091 fl = self._filelog
2092 2092 pcl = self._changectx._parents
2093 2093 renamed = self.renamed()
2094 2094
2095 2095 if renamed:
2096 2096 pl = [renamed + (None,)]
2097 2097 else:
2098 2098 pl = [(path, filenode(pcl[0], path), fl)]
2099 2099
2100 2100 for pc in pcl[1:]:
2101 2101 pl.append((path, filenode(pc, path), fl))
2102 2102
2103 2103 return [
2104 2104 self._parentfilectx(p, fileid=n, filelog=l)
2105 2105 for p, n, l in pl
2106 2106 if n != self._repo.nodeconstants.nullid
2107 2107 ]
2108 2108
2109 2109 def children(self):
2110 2110 return []
2111 2111
2112 2112
2113 2113 class workingfilectx(committablefilectx):
2114 2114 """A workingfilectx object makes access to data related to a particular
2115 2115 file in the working directory convenient."""
2116 2116
2117 2117 def __init__(self, repo, path, filelog=None, workingctx=None):
2118 2118 super(workingfilectx, self).__init__(repo, path, filelog, workingctx)
2119 2119
2120 2120 @propertycache
2121 2121 def _changectx(self):
2122 2122 return workingctx(self._repo)
2123 2123
2124 2124 def data(self):
2125 2125 return self._repo.wread(self._path)
2126 2126
2127 2127 def copysource(self):
2128 2128 return self._repo.dirstate.copied(self._path)
2129 2129
2130 2130 def size(self):
2131 2131 return self._repo.wvfs.lstat(self._path).st_size
2132 2132
2133 2133 def lstat(self):
2134 2134 return self._repo.wvfs.lstat(self._path)
2135 2135
2136 2136 def date(self):
2137 2137 t, tz = self._changectx.date()
2138 2138 try:
2139 2139 return (self._repo.wvfs.lstat(self._path)[stat.ST_MTIME], tz)
2140 2140 except OSError as err:
2141 2141 if err.errno != errno.ENOENT:
2142 2142 raise
2143 2143 return (t, tz)
2144 2144
2145 2145 def exists(self):
2146 2146 return self._repo.wvfs.exists(self._path)
2147 2147
2148 2148 def lexists(self):
2149 2149 return self._repo.wvfs.lexists(self._path)
2150 2150
2151 2151 def audit(self):
2152 2152 return self._repo.wvfs.audit(self._path)
2153 2153
2154 2154 def cmp(self, fctx):
2155 2155 """compare with other file context
2156 2156
2157 2157 returns True if different from fctx.
2158 2158 """
2159 2159 # fctx should be a filectx (not a workingfilectx)
2160 2160 # invert comparison to reuse the same code path
2161 2161 return fctx.cmp(self)
2162 2162
2163 2163 def remove(self, ignoremissing=False):
2164 2164 """wraps unlink for a repo's working directory"""
2165 2165 rmdir = self._repo.ui.configbool(b'experimental', b'removeemptydirs')
2166 2166 self._repo.wvfs.unlinkpath(
2167 2167 self._path, ignoremissing=ignoremissing, rmdir=rmdir
2168 2168 )
2169 2169
2170 2170 def write(self, data, flags, backgroundclose=False, **kwargs):
2171 2171 """wraps repo.wwrite"""
2172 2172 return self._repo.wwrite(
2173 2173 self._path, data, flags, backgroundclose=backgroundclose, **kwargs
2174 2174 )
2175 2175
2176 2176 def markcopied(self, src):
2177 2177 """marks this file a copy of `src`"""
2178 2178 self._repo.dirstate.copy(src, self._path)
2179 2179
2180 2180 def clearunknown(self):
2181 2181 """Removes conflicting items in the working directory so that
2182 2182 ``write()`` can be called successfully.
2183 2183 """
2184 2184 wvfs = self._repo.wvfs
2185 2185 f = self._path
2186 2186 wvfs.audit(f)
2187 2187 if self._repo.ui.configbool(
2188 2188 b'experimental', b'merge.checkpathconflicts'
2189 2189 ):
2190 2190 # remove files under the directory as they should already be
2191 2191 # warned and backed up
2192 2192 if wvfs.isdir(f) and not wvfs.islink(f):
2193 2193 wvfs.rmtree(f, forcibly=True)
2194 2194 for p in reversed(list(pathutil.finddirs(f))):
2195 2195 if wvfs.isfileorlink(p):
2196 2196 wvfs.unlink(p)
2197 2197 break
2198 2198 else:
2199 2199 # don't remove files if path conflicts are not processed
2200 2200 if wvfs.isdir(f) and not wvfs.islink(f):
2201 2201 wvfs.removedirs(f)
2202 2202
2203 2203 def setflags(self, l, x):
2204 2204 self._repo.wvfs.setflags(self._path, l, x)
2205 2205
2206 2206
2207 2207 class overlayworkingctx(committablectx):
2208 2208 """Wraps another mutable context with a write-back cache that can be
2209 2209 converted into a commit context.
2210 2210
2211 2211 self._cache[path] maps to a dict with keys: {
2212 2212 'exists': bool?
2213 2213 'date': date?
2214 2214 'data': str?
2215 2215 'flags': str?
2216 2216 'copied': str? (path or None)
2217 2217 }
2218 2218 If `exists` is True, `flags` must be non-None and `date` is non-None. If it
2219 2219 is `False`, the file was deleted.
2220 2220 """
2221 2221
2222 2222 def __init__(self, repo):
2223 2223 super(overlayworkingctx, self).__init__(repo)
2224 2224 self.clean()
2225 2225
2226 2226 def setbase(self, wrappedctx):
2227 2227 self._wrappedctx = wrappedctx
2228 2228 self._parents = [wrappedctx]
2229 2229 # Drop old manifest cache as it is now out of date.
2230 2230 # This is necessary when, e.g., rebasing several nodes with one
2231 2231 # ``overlayworkingctx`` (e.g. with --collapse).
2232 2232 util.clearcachedproperty(self, b'_manifest')
2233 2233
2234 2234 def setparents(self, p1node, p2node=None):
2235 2235 if p2node is None:
2236 2236 p2node = self._repo.nodeconstants.nullid
2237 2237 assert p1node == self._wrappedctx.node()
2238 2238 self._parents = [self._wrappedctx, self._repo.unfiltered()[p2node]]
2239 2239
2240 2240 def data(self, path):
2241 2241 if self.isdirty(path):
2242 2242 if self._cache[path][b'exists']:
2243 2243 if self._cache[path][b'data'] is not None:
2244 2244 return self._cache[path][b'data']
2245 2245 else:
2246 2246 # Must fallback here, too, because we only set flags.
2247 2247 return self._wrappedctx[path].data()
2248 2248 else:
2249 2249 raise error.ProgrammingError(
2250 2250 b"No such file or directory: %s" % path
2251 2251 )
2252 2252 else:
2253 2253 return self._wrappedctx[path].data()
2254 2254
2255 2255 @propertycache
2256 2256 def _manifest(self):
2257 2257 parents = self.parents()
2258 2258 man = parents[0].manifest().copy()
2259 2259
2260 2260 flag = self._flagfunc
2261 2261 for path in self.added():
2262 2262 man[path] = self._repo.nodeconstants.addednodeid
2263 2263 man.setflag(path, flag(path))
2264 2264 for path in self.modified():
2265 2265 man[path] = self._repo.nodeconstants.modifiednodeid
2266 2266 man.setflag(path, flag(path))
2267 2267 for path in self.removed():
2268 2268 del man[path]
2269 2269 return man
2270 2270
2271 2271 @propertycache
2272 2272 def _flagfunc(self):
2273 2273 def f(path):
2274 2274 return self._cache[path][b'flags']
2275 2275
2276 2276 return f
2277 2277
2278 2278 def files(self):
2279 2279 return sorted(self.added() + self.modified() + self.removed())
2280 2280
2281 2281 def modified(self):
2282 2282 return [
2283 2283 f
2284 2284 for f in self._cache.keys()
2285 2285 if self._cache[f][b'exists'] and self._existsinparent(f)
2286 2286 ]
2287 2287
2288 2288 def added(self):
2289 2289 return [
2290 2290 f
2291 2291 for f in self._cache.keys()
2292 2292 if self._cache[f][b'exists'] and not self._existsinparent(f)
2293 2293 ]
2294 2294
2295 2295 def removed(self):
2296 2296 return [
2297 2297 f
2298 2298 for f in self._cache.keys()
2299 2299 if not self._cache[f][b'exists'] and self._existsinparent(f)
2300 2300 ]
2301 2301
2302 2302 def p1copies(self):
2303 2303 copies = {}
2304 2304 narrowmatch = self._repo.narrowmatch()
2305 2305 for f in self._cache.keys():
2306 2306 if not narrowmatch(f):
2307 2307 continue
2308 2308 copies.pop(f, None) # delete if it exists
2309 2309 source = self._cache[f][b'copied']
2310 2310 if source:
2311 2311 copies[f] = source
2312 2312 return copies
2313 2313
2314 2314 def p2copies(self):
2315 2315 copies = {}
2316 2316 narrowmatch = self._repo.narrowmatch()
2317 2317 for f in self._cache.keys():
2318 2318 if not narrowmatch(f):
2319 2319 continue
2320 2320 copies.pop(f, None) # delete if it exists
2321 2321 source = self._cache[f][b'copied']
2322 2322 if source:
2323 2323 copies[f] = source
2324 2324 return copies
2325 2325
2326 2326 def isinmemory(self):
2327 2327 return True
2328 2328
2329 2329 def filedate(self, path):
2330 2330 if self.isdirty(path):
2331 2331 return self._cache[path][b'date']
2332 2332 else:
2333 2333 return self._wrappedctx[path].date()
2334 2334
2335 2335 def markcopied(self, path, origin):
2336 2336 self._markdirty(
2337 2337 path,
2338 2338 exists=True,
2339 2339 date=self.filedate(path),
2340 2340 flags=self.flags(path),
2341 2341 copied=origin,
2342 2342 )
2343 2343
2344 2344 def copydata(self, path):
2345 2345 if self.isdirty(path):
2346 2346 return self._cache[path][b'copied']
2347 2347 else:
2348 2348 return None
2349 2349
2350 2350 def flags(self, path):
2351 2351 if self.isdirty(path):
2352 2352 if self._cache[path][b'exists']:
2353 2353 return self._cache[path][b'flags']
2354 2354 else:
2355 2355 raise error.ProgrammingError(
2356 2356 b"No such file or directory: %s" % path
2357 2357 )
2358 2358 else:
2359 2359 return self._wrappedctx[path].flags()
2360 2360
2361 2361 def __contains__(self, key):
2362 2362 if key in self._cache:
2363 2363 return self._cache[key][b'exists']
2364 2364 return key in self.p1()
2365 2365
2366 2366 def _existsinparent(self, path):
2367 2367 try:
2368 2368 # ``commitctx`` raises a ``ManifestLookupError`` if a path does not
2369 2369 # exist, unlike ``workingctx``, which returns a ``workingfilectx``
2370 2370 # with an ``exists()`` function.
2371 2371 self._wrappedctx[path]
2372 2372 return True
2373 2373 except error.ManifestLookupError:
2374 2374 return False
2375 2375
2376 2376 def _auditconflicts(self, path):
2377 2377 """Replicates conflict checks done by wvfs.write().
2378 2378
2379 2379 Since we never write to the filesystem and never call `applyupdates` in
2380 2380 IMM, we'll never check that a path is actually writable -- e.g., because
2381 2381 it adds `a/foo`, but `a` is actually a file in the other commit.
2382 2382 """
2383 2383
2384 2384 def fail(path, component):
2385 2385 # p1() is the base and we're receiving "writes" for p2()'s
2386 2386 # files.
2387 2387 if b'l' in self.p1()[component].flags():
2388 2388 raise error.Abort(
2389 2389 b"error: %s conflicts with symlink %s "
2390 2390 b"in %d." % (path, component, self.p1().rev())
2391 2391 )
2392 2392 else:
2393 2393 raise error.Abort(
2394 2394 b"error: '%s' conflicts with file '%s' in "
2395 2395 b"%d." % (path, component, self.p1().rev())
2396 2396 )
2397 2397
2398 2398 # Test that each new directory to be created to write this path from p2
2399 2399 # is not a file in p1.
2400 2400 components = path.split(b'/')
2401 2401 for i in pycompat.xrange(len(components)):
2402 2402 component = b"/".join(components[0:i])
2403 2403 if component in self:
2404 2404 fail(path, component)
2405 2405
2406 2406 # Test the other direction -- that this path from p2 isn't a directory
2407 2407 # in p1 (test that p1 doesn't have any paths matching `path/*`).
2408 2408 match = self.match([path], default=b'path')
2409 2409 mfiles = list(self.p1().manifest().walk(match))
2410 2410 if len(mfiles) > 0:
2411 2411 if len(mfiles) == 1 and mfiles[0] == path:
2412 2412 return
2413 2413 # omit the files which are deleted in current IMM wctx
2414 2414 mfiles = [m for m in mfiles if m in self]
2415 2415 if not mfiles:
2416 2416 return
2417 2417 raise error.Abort(
2418 2418 b"error: file '%s' cannot be written because "
2419 2419 b" '%s/' is a directory in %s (containing %d "
2420 2420 b"entries: %s)"
2421 2421 % (path, path, self.p1(), len(mfiles), b', '.join(mfiles))
2422 2422 )
2423 2423
2424 2424 def write(self, path, data, flags=b'', **kwargs):
2425 2425 if data is None:
2426 2426 raise error.ProgrammingError(b"data must be non-None")
2427 2427 self._auditconflicts(path)
2428 2428 self._markdirty(
2429 2429 path, exists=True, data=data, date=dateutil.makedate(), flags=flags
2430 2430 )
2431 2431
2432 2432 def setflags(self, path, l, x):
2433 2433 flag = b''
2434 2434 if l:
2435 2435 flag = b'l'
2436 2436 elif x:
2437 2437 flag = b'x'
2438 2438 self._markdirty(path, exists=True, date=dateutil.makedate(), flags=flag)
2439 2439
2440 2440 def remove(self, path):
2441 2441 self._markdirty(path, exists=False)
2442 2442
2443 2443 def exists(self, path):
2444 2444 """exists behaves like `lexists`, but needs to follow symlinks and
2445 2445 return False if they are broken.
2446 2446 """
2447 2447 if self.isdirty(path):
2448 2448 # If this path exists and is a symlink, "follow" it by calling
2449 2449 # exists on the destination path.
2450 2450 if (
2451 2451 self._cache[path][b'exists']
2452 2452 and b'l' in self._cache[path][b'flags']
2453 2453 ):
2454 2454 return self.exists(self._cache[path][b'data'].strip())
2455 2455 else:
2456 2456 return self._cache[path][b'exists']
2457 2457
2458 2458 return self._existsinparent(path)
2459 2459
2460 2460 def lexists(self, path):
2461 2461 """lexists returns True if the path exists"""
2462 2462 if self.isdirty(path):
2463 2463 return self._cache[path][b'exists']
2464 2464
2465 2465 return self._existsinparent(path)
2466 2466
2467 2467 def size(self, path):
2468 2468 if self.isdirty(path):
2469 2469 if self._cache[path][b'exists']:
2470 2470 return len(self._cache[path][b'data'])
2471 2471 else:
2472 2472 raise error.ProgrammingError(
2473 2473 b"No such file or directory: %s" % path
2474 2474 )
2475 2475 return self._wrappedctx[path].size()
2476 2476
2477 2477 def tomemctx(
2478 2478 self,
2479 2479 text,
2480 2480 branch=None,
2481 2481 extra=None,
2482 2482 date=None,
2483 2483 parents=None,
2484 2484 user=None,
2485 2485 editor=None,
2486 2486 ):
2487 2487 """Converts this ``overlayworkingctx`` into a ``memctx`` ready to be
2488 2488 committed.
2489 2489
2490 2490 ``text`` is the commit message.
2491 2491 ``parents`` (optional) are rev numbers.
2492 2492 """
2493 2493 # Default parents to the wrapped context if not passed.
2494 2494 if parents is None:
2495 2495 parents = self.parents()
2496 2496 if len(parents) == 1:
2497 2497 parents = (parents[0], None)
2498 2498
2499 2499 # ``parents`` is passed as rev numbers; convert to ``commitctxs``.
2500 2500 if parents[1] is None:
2501 2501 parents = (self._repo[parents[0]], None)
2502 2502 else:
2503 2503 parents = (self._repo[parents[0]], self._repo[parents[1]])
2504 2504
2505 2505 files = self.files()
2506 2506
2507 2507 def getfile(repo, memctx, path):
2508 2508 if self._cache[path][b'exists']:
2509 2509 return memfilectx(
2510 2510 repo,
2511 2511 memctx,
2512 2512 path,
2513 2513 self._cache[path][b'data'],
2514 2514 b'l' in self._cache[path][b'flags'],
2515 2515 b'x' in self._cache[path][b'flags'],
2516 2516 self._cache[path][b'copied'],
2517 2517 )
2518 2518 else:
2519 2519 # Returning None, but including the path in `files`, is
2520 2520 # necessary for memctx to register a deletion.
2521 2521 return None
2522 2522
2523 2523 if branch is None:
2524 2524 branch = self._wrappedctx.branch()
2525 2525
2526 2526 return memctx(
2527 2527 self._repo,
2528 2528 parents,
2529 2529 text,
2530 2530 files,
2531 2531 getfile,
2532 2532 date=date,
2533 2533 extra=extra,
2534 2534 user=user,
2535 2535 branch=branch,
2536 2536 editor=editor,
2537 2537 )
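
# e.g. (illustrative) flushing the overlay into a committable object:
#
#   mctx = overlay.tomemctx(b'rebased change', user=b'committer')
#   node = repo.commitctx(mctx)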
2538 2538
2539 2539 def tomemctx_for_amend(self, precursor):
2540 2540 extra = precursor.extra().copy()
2541 2541 extra[b'amend_source'] = precursor.hex()
2542 2542 return self.tomemctx(
2543 2543 text=precursor.description(),
2544 2544 branch=precursor.branch(),
2545 2545 extra=extra,
2546 2546 date=precursor.date(),
2547 2547 user=precursor.user(),
2548 2548 )
2549 2549
2550 2550 def isdirty(self, path):
2551 2551 return path in self._cache
2552 2552
2553 2553 def clean(self):
2554 2554 self._mergestate = None
2555 2555 self._cache = {}
2556 2556
2557 2557 def _compact(self):
2558 2558 """Removes keys from the cache that are actually clean, by comparing
2559 2559 them with the underlying context.
2560 2560
2561 2561 This can occur during the merge process, e.g. by passing --tool :local
2562 2562 to resolve a conflict.
2563 2563 """
2564 2564 keys = []
2565 2565 # This won't be perfect, but can help performance significantly when
2566 2566 # using things like remotefilelog.
2567 2567 scmutil.prefetchfiles(
2568 2568 self.repo(),
2569 2569 [
2570 2570 (
2571 2571 self.p1().rev(),
2572 2572 scmutil.matchfiles(self.repo(), self._cache.keys()),
2573 2573 )
2574 2574 ],
2575 2575 )
2576 2576
2577 2577 for path in self._cache.keys():
2578 2578 cache = self._cache[path]
2579 2579 try:
2580 2580 underlying = self._wrappedctx[path]
2581 2581 if (
2582 2582 underlying.data() == cache[b'data']
2583 2583 and underlying.flags() == cache[b'flags']
2584 2584 ):
2585 2585 keys.append(path)
2586 2586 except error.ManifestLookupError:
2587 2587 # Path not in the underlying manifest (created).
2588 2588 continue
2589 2589
2590 2590 for path in keys:
2591 2591 del self._cache[path]
2592 2592 return keys
2593 2593
2594 2594 def _markdirty(
2595 2595 self, path, exists, data=None, date=None, flags=b'', copied=None
2596 2596 ):
2597 2597 # data not provided, let's see if we already have some; if not, let's
2598 2598 # grab it from our underlying context, so that we always have data if
2599 2599 # the file is marked as existing.
2600 2600 if exists and data is None:
2601 2601 oldentry = self._cache.get(path) or {}
2602 2602 data = oldentry.get(b'data')
2603 2603 if data is None:
2604 2604 data = self._wrappedctx[path].data()
2605 2605
2606 2606 self._cache[path] = {
2607 2607 b'exists': exists,
2608 2608 b'data': data,
2609 2609 b'date': date,
2610 2610 b'flags': flags,
2611 2611 b'copied': copied,
2612 2612 }
2613 2613 util.clearcachedproperty(self, b'_manifest')
2614 2614
2615 2615 def filectx(self, path, filelog=None):
2616 2616 return overlayworkingfilectx(
2617 2617 self._repo, path, parent=self, filelog=filelog
2618 2618 )
2619 2619
2620 2620 def mergestate(self, clean=False):
2621 2621 if clean or self._mergestate is None:
2622 2622 self._mergestate = mergestatemod.memmergestate(self._repo)
2623 2623 return self._mergestate
2624 2624
2625 2625
2626 2626 class overlayworkingfilectx(committablefilectx):
2627 2627 """Wrap a ``workingfilectx`` but intercepts all writes into an in-memory
2628 2628 cache, which can be flushed through later by calling ``flush()``."""
2629 2629
2630 2630 def __init__(self, repo, path, filelog=None, parent=None):
2631 2631 super(overlayworkingfilectx, self).__init__(repo, path, filelog, parent)
2632 2632 self._repo = repo
2633 2633 self._parent = parent
2634 2634 self._path = path
2635 2635
2636 2636 def cmp(self, fctx):
2637 2637 return self.data() != fctx.data()
2638 2638
2639 2639 def changectx(self):
2640 2640 return self._parent
2641 2641
2642 2642 def data(self):
2643 2643 return self._parent.data(self._path)
2644 2644
2645 2645 def date(self):
2646 2646 return self._parent.filedate(self._path)
2647 2647
2648 2648 def exists(self):
2649 2649 return self.lexists()
2650 2650
2651 2651 def lexists(self):
2652 2652 return self._parent.exists(self._path)
2653 2653
2654 2654 def copysource(self):
2655 2655 return self._parent.copydata(self._path)
2656 2656
2657 2657 def size(self):
2658 2658 return self._parent.size(self._path)
2659 2659
2660 2660 def markcopied(self, origin):
2661 2661 self._parent.markcopied(self._path, origin)
2662 2662
2663 2663 def audit(self):
2664 2664 pass
2665 2665
2666 2666 def flags(self):
2667 2667 return self._parent.flags(self._path)
2668 2668
2669 2669 def setflags(self, islink, isexec):
2670 2670 return self._parent.setflags(self._path, islink, isexec)
2671 2671
2672 2672 def write(self, data, flags, backgroundclose=False, **kwargs):
2673 2673 return self._parent.write(self._path, data, flags, **kwargs)
2674 2674
2675 2675 def remove(self, ignoremissing=False):
2676 2676 return self._parent.remove(self._path)
2677 2677
2678 2678 def clearunknown(self):
2679 2679 pass
2680 2680
2681 2681
2682 2682 class workingcommitctx(workingctx):
2683 2683 """A workingcommitctx object makes access to data related to
2684 2684 the revision being committed convenient.
2685 2685
2686 2686 This hides changes in the working directory if they aren't
2687 2687 committed in this context.
2688 2688 """
2689 2689
2690 2690 def __init__(
2691 2691 self, repo, changes, text=b"", user=None, date=None, extra=None
2692 2692 ):
2693 2693 super(workingcommitctx, self).__init__(
2694 2694 repo, text, user, date, extra, changes
2695 2695 )
2696 2696
2697 2697 def _dirstatestatus(self, match, ignored=False, clean=False, unknown=False):
2698 2698 """Return matched files only in ``self._status``
2699 2699
2700 2700 Uncommitted files appear "clean" via this context, even if
2701 2701 they aren't actually so in the working directory.
2702 2702 """
2703 2703 if clean:
2704 2704 clean = [f for f in self._manifest if f not in self._changedset]
2705 2705 else:
2706 2706 clean = []
2707 2707 return scmutil.status(
2708 2708 [f for f in self._status.modified if match(f)],
2709 2709 [f for f in self._status.added if match(f)],
2710 2710 [f for f in self._status.removed if match(f)],
2711 2711 [],
2712 2712 [],
2713 2713 [],
2714 2714 clean,
2715 2715 )
2716 2716
2717 2717 @propertycache
2718 2718 def _changedset(self):
2719 2719 """Return the set of files changed in this context"""
2720 2720 changed = set(self._status.modified)
2721 2721 changed.update(self._status.added)
2722 2722 changed.update(self._status.removed)
2723 2723 return changed
2724 2724
2725 2725
2726 2726 def makecachingfilectxfn(func):
2727 2727 """Create a filectxfn that caches based on the path.
2728 2728
2729 2729 We can't use util.cachefunc because it uses all arguments as the cache
2730 2730 key and this creates a cycle since the arguments include the repo and
2731 2731 memctx.
2732 2732 """
2733 2733 cache = {}
2734 2734
2735 2735 def getfilectx(repo, memctx, path):
2736 2736 if path not in cache:
2737 2737 cache[path] = func(repo, memctx, path)
2738 2738 return cache[path]
2739 2739
2740 2740 return getfilectx
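
# e.g. (illustrative; ``expensive_filectxfn`` is hypothetical): each path
# is computed at most once per wrapper:
#
#   filectxfn = makecachingfilectxfn(expensive_filectxfn)
#   filectxfn(repo, mctx, b'a')  # invokes expensive_filectxfn
#   filectxfn(repo, mctx, b'a')  # served from the cache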
2741 2741
2742 2742
2743 2743 def memfilefromctx(ctx):
2744 2744 """Given a context return a memfilectx for ctx[path]
2745 2745
2746 2746 This is a convenience method for building a memctx based on another
2747 2747 context.
2748 2748 """
2749 2749
2750 2750 def getfilectx(repo, memctx, path):
2751 2751 fctx = ctx[path]
2752 2752 copysource = fctx.copysource()
2753 2753 return memfilectx(
2754 2754 repo,
2755 2755 memctx,
2756 2756 path,
2757 2757 fctx.data(),
2758 2758 islink=fctx.islink(),
2759 2759 isexec=fctx.isexec(),
2760 2760 copysource=copysource,
2761 2761 )
2762 2762
2763 2763 return getfilectx
2764 2764
2765 2765
2766 2766 def memfilefrompatch(patchstore):
2767 2767 """Given a patch (e.g. patchstore object) return a memfilectx
2768 2768
2769 2769 This is a convenience method for building a memctx based on a patchstore.
2770 2770 """
2771 2771
2772 2772 def getfilectx(repo, memctx, path):
2773 2773 data, mode, copysource = patchstore.getfile(path)
2774 2774 if data is None:
2775 2775 return None
2776 2776 islink, isexec = mode
2777 2777 return memfilectx(
2778 2778 repo,
2779 2779 memctx,
2780 2780 path,
2781 2781 data,
2782 2782 islink=islink,
2783 2783 isexec=isexec,
2784 2784 copysource=copysource,
2785 2785 )
2786 2786
2787 2787 return getfilectx
2788 2788
2789 2789
2790 2790 class memctx(committablectx):
2791 2791 """Use memctx to perform in-memory commits via localrepo.commitctx().
2792 2792
2793 2793 Revision information is supplied at initialization time, while
2794 2794 related file data is made available through a callback
2795 2795 mechanism. 'repo' is the current localrepo, 'parents' is a
2796 2796 sequence of two parent revisions identifiers (pass None for every
2797 2797 missing parent), 'text' is the commit message and 'files' lists
2798 2798 names of files touched by the revision (normalized and relative to
2799 2799 repository root).
2800 2800
2801 2801 filectxfn(repo, memctx, path) is a callable receiving the
2802 2802 repository, the current memctx object and the normalized path of
2803 2803 requested file, relative to repository root. It is fired by the
2804 2804 commit function for every file in 'files', but calls order is
2805 2805 undefined. If the file is available in the revision being
2806 2806 committed (updated or added), filectxfn returns a memfilectx
2807 2807 object. If the file was removed, filectxfn return None for recent
2808 2808 Mercurial. Moved files are represented by marking the source file
2809 2809 removed and the new file added with copy information (see
2810 2810 memfilectx).
2811 2811
2812 2812 user receives the committer name and defaults to current
2813 2813 repository username, date is the commit date in any format
2814 2814 supported by dateutil.parsedate() and defaults to current date, extra
2815 2815 is a dictionary of metadata or is left empty.
2816 2816 """
2817 2817
2818 2818 # Mercurial <= 3.1 expects the filectxfn to raise IOError for missing files.
2819 2819 # Extensions that need to retain compatibility across Mercurial 3.1 can use
2820 2820 # this field to determine what to do in filectxfn.
2821 2821 _returnnoneformissingfiles = True
2822 2822
2823 2823 def __init__(
2824 2824 self,
2825 2825 repo,
2826 2826 parents,
2827 2827 text,
2828 2828 files,
2829 2829 filectxfn,
2830 2830 user=None,
2831 2831 date=None,
2832 2832 extra=None,
2833 2833 branch=None,
2834 2834 editor=None,
2835 2835 ):
2836 2836 super(memctx, self).__init__(
2837 2837 repo, text, user, date, extra, branch=branch
2838 2838 )
2839 2839 self._rev = None
2840 2840 self._node = None
2841 2841 parents = [(p or self._repo.nodeconstants.nullid) for p in parents]
2842 2842 p1, p2 = parents
2843 2843 self._parents = [self._repo[p] for p in (p1, p2)]
2844 2844 files = sorted(set(files))
2845 2845 self._files = files
2846 2846 self.substate = {}
2847 2847
2848 2848 if isinstance(filectxfn, patch.filestore):
2849 2849 filectxfn = memfilefrompatch(filectxfn)
2850 2850 elif not callable(filectxfn):
2851 2851 # if store is not callable, wrap it in a function
2852 2852 filectxfn = memfilefromctx(filectxfn)
2853 2853
2854 2854 # memoizing increases performance for e.g. vcs convert scenarios.
2855 2855 self._filectxfn = makecachingfilectxfn(filectxfn)
2856 2856
2857 2857 if editor:
2858 2858 self._text = editor(self._repo, self, [])
2859 2859 self._repo.savecommitmessage(self._text)
2860 2860
2861 2861 def filectx(self, path, filelog=None):
2862 2862 """get a file context from the working directory
2863 2863
2864 2864 Returns None if file doesn't exist and should be removed."""
2865 2865 return self._filectxfn(self._repo, self, path)
2866 2866
2867 2867 def commit(self):
2868 2868 """commit context to the repo"""
2869 2869 return self._repo.commitctx(self)
2870 2870
2871 2871 @propertycache
2872 2872 def _manifest(self):
2873 2873 """generate a manifest based on the return values of filectxfn"""
2874 2874
2875 2875 # keep this simple for now; just worry about p1
2876 2876 pctx = self._parents[0]
2877 2877 man = pctx.manifest().copy()
2878 2878
2879 2879 for f in self._status.modified:
2880 2880 man[f] = self._repo.nodeconstants.modifiednodeid
2881 2881
2882 2882 for f in self._status.added:
2883 2883 man[f] = self._repo.nodeconstants.addednodeid
2884 2884
2885 2885 for f in self._status.removed:
2886 2886 if f in man:
2887 2887 del man[f]
2888 2888
2889 2889 return man
2890 2890
2891 2891 @propertycache
2892 2892 def _status(self):
2893 2893 """Calculate exact status from ``files`` specified at construction"""
2894 2894 man1 = self.p1().manifest()
2895 2895 p2 = self._parents[1]
2896 2896 # "1 < len(self._parents)" can't be used for checking
2897 2897 # existence of the 2nd parent, because "memctx._parents" is
2898 2898 # explicitly initialized with a list whose length is 2.
2899 2899 if p2.rev() != nullrev:
2900 2900 man2 = p2.manifest()
2901 2901 managing = lambda f: f in man1 or f in man2
2902 2902 else:
2903 2903 managing = lambda f: f in man1
2904 2904
2905 2905 modified, added, removed = [], [], []
2906 2906 for f in self._files:
2907 2907 if not managing(f):
2908 2908 added.append(f)
2909 2909 elif self[f]:
2910 2910 modified.append(f)
2911 2911 else:
2912 2912 removed.append(f)
2913 2913
2914 2914 return scmutil.status(modified, added, removed, [], [], [], [])
2915 2915
2916 2916 def parents(self):
2917 2917 if self._parents[1].rev() == nullrev:
2918 2918 return [self._parents[0]]
2919 2919 return self._parents
2920 2920
2921 2921
2922 2922 class memfilectx(committablefilectx):
2923 2923 """memfilectx represents an in-memory file to commit.
2924 2924
2925 2925 See memctx and committablefilectx for more details.
2926 2926 """
2927 2927
2928 2928 def __init__(
2929 2929 self,
2930 2930 repo,
2931 2931 changectx,
2932 2932 path,
2933 2933 data,
2934 2934 islink=False,
2935 2935 isexec=False,
2936 2936 copysource=None,
2937 2937 ):
2938 2938 """
2939 2939 path is the normalized file path relative to repository root.
2940 2940 data is the file content as a string.
2941 2941 islink is True if the file is a symbolic link.
2942 2942 isexec is True if the file is executable.
2943 2943 copysource is the source file path if the current file was copied in the
2944 2944 revision being committed, or None."""
2945 2945 super(memfilectx, self).__init__(repo, path, None, changectx)
2946 2946 self._data = data
2947 2947 if islink:
2948 2948 self._flags = b'l'
2949 2949 elif isexec:
2950 2950 self._flags = b'x'
2951 2951 else:
2952 2952 self._flags = b''
2953 2953 self._copysource = copysource
2954 2954
2955 2955 def copysource(self):
2956 2956 return self._copysource
2957 2957
2958 2958 def cmp(self, fctx):
2959 2959 return self.data() != fctx.data()
2960 2960
2961 2961 def data(self):
2962 2962 return self._data
2963 2963
2964 2964 def remove(self, ignoremissing=False):
2965 2965 """wraps unlink for a repo's working directory"""
2966 2966 # need to figure out what to do here
2967 2967 del self._changectx[self._path]
2968 2968
2969 2969 def write(self, data, flags, **kwargs):
2970 2970 """wraps repo.wwrite"""
2971 2971 self._data = data
2972 2972
2973 2973
2974 2974 class metadataonlyctx(committablectx):
2975 2975 """Like memctx but it's reusing the manifest of different commit.
2976 2976 Intended to be used by lightweight operations that are creating
2977 2977 metadata-only changes.
2978 2978
2979 2979 Revision information is supplied at initialization time. 'repo' is the
2980 2980 current localrepo, 'originalctx' is the original revision whose manifest we're reusing,
2981 2981 'parents' is a sequence of two parent revision identifiers (pass None for
2982 2982 every missing parent), 'text' is the commit message.
2983 2983
2984 2984 user receives the committer name and defaults to current repository
2985 2985 username, date is the commit date in any format supported by
2986 2986 dateutil.parsedate() and defaults to current date, extra is a dictionary of
2987 2987 metadata or is left empty.
2988 2988 """
2989 2989
2990 2990 def __init__(
2991 2991 self,
2992 2992 repo,
2993 2993 originalctx,
2994 2994 parents=None,
2995 2995 text=None,
2996 2996 user=None,
2997 2997 date=None,
2998 2998 extra=None,
2999 2999 editor=None,
3000 3000 ):
3001 3001 if text is None:
3002 3002 text = originalctx.description()
3003 3003 super(metadataonlyctx, self).__init__(repo, text, user, date, extra)
3004 3004 self._rev = None
3005 3005 self._node = None
3006 3006 self._originalctx = originalctx
3007 3007 self._manifestnode = originalctx.manifestnode()
3008 3008 if parents is None:
3009 3009 parents = originalctx.parents()
3010 3010 else:
3011 3011 parents = [repo[p] for p in parents if p is not None]
3012 3012 parents = parents[:]
3013 3013 while len(parents) < 2:
3014 3014 parents.append(repo[nullrev])
3015 3015 p1, p2 = self._parents = parents
3016 3016
3017 3017 # sanity check to ensure that the reused manifest parents are
3018 3018 # manifests of our commit parents
3019 3019 mp1, mp2 = self.manifestctx().parents
3020 3020 if p1 != self._repo.nodeconstants.nullid and p1.manifestnode() != mp1:
3021 3021 raise RuntimeError(
3022 3022 r"can't reuse the manifest: its p1 "
3023 3023 r"doesn't match the new ctx p1"
3024 3024 )
3025 3025 if p2 != self._repo.nodeconstants.nullid and p2.manifestnode() != mp2:
3026 3026 raise RuntimeError(
3027 3027 r"can't reuse the manifest: "
3028 3028 r"its p2 doesn't match the new ctx p2"
3029 3029 )
3030 3030
3031 3031 self._files = originalctx.files()
3032 3032 self.substate = {}
3033 3033
3034 3034 if editor:
3035 3035 self._text = editor(self._repo, self, [])
3036 3036 self._repo.savecommitmessage(self._text)
3037 3037
3038 3038 def manifestnode(self):
3039 3039 return self._manifestnode
3040 3040
3041 3041 @property
3042 3042 def _manifestctx(self):
3043 3043 return self._repo.manifestlog[self._manifestnode]
3044 3044
3045 3045 def filectx(self, path, filelog=None):
3046 3046 return self._originalctx.filectx(path, filelog=filelog)
3047 3047
3048 3048 def commit(self):
3049 3049 """commit context to the repo"""
3050 3050 return self._repo.commitctx(self)
3051 3051
3052 3052 @property
3053 3053 def _manifest(self):
3054 3054 return self._originalctx.manifest()
3055 3055
3056 3056 @propertycache
3057 3057 def _status(self):
3058 3058 """Calculate exact status from ``files`` specified in the ``origctx``
3059 3059 and parents manifests.
3060 3060 """
3061 3061 man1 = self.p1().manifest()
3062 3062 p2 = self._parents[1]
3063 3063 # "1 < len(self._parents)" can't be used for checking
3064 3064 # existence of the 2nd parent, because "metadataonlyctx._parents" is
3065 3065 # explicitly initialized with a list whose length is 2.
3066 3066 if p2.rev() != nullrev:
3067 3067 man2 = p2.manifest()
3068 3068 managing = lambda f: f in man1 or f in man2
3069 3069 else:
3070 3070 managing = lambda f: f in man1
3071 3071
3072 3072 modified, added, removed = [], [], []
3073 3073 for f in self._files:
3074 3074 if not managing(f):
3075 3075 added.append(f)
3076 3076 elif f in self:
3077 3077 modified.append(f)
3078 3078 else:
3079 3079 removed.append(f)
3080 3080
3081 3081 return scmutil.status(modified, added, removed, [], [], [], [])
3082 3082
3083 3083
3084 3084 class arbitraryfilectx(object):
3085 3085 """Allows you to use filectx-like functions on a file in an arbitrary
3086 3086 location on disk, possibly not in the working directory.
3087 3087 """
3088 3088
3089 3089 def __init__(self, path, repo=None):
3090 3090 # Repo is optional because contrib/simplemerge uses this class.
3091 3091 self._repo = repo
3092 3092 self._path = path
3093 3093
3094 3094 def cmp(self, fctx):
3095 3095 # filecmp follows symlinks whereas `cmp` should not, so skip the fast
3096 3096 # path if either side is a symlink.
3097 3097 symlinks = b'l' in self.flags() or b'l' in fctx.flags()
3098 3098 if not symlinks and isinstance(fctx, workingfilectx) and self._repo:
3099 3099 # Add a fast-path for merge if both sides are disk-backed.
3100 3100 # Note that filecmp uses the opposite return values (True if same)
3101 3101 # from our cmp functions (True if different).
3102 3102 return not filecmp.cmp(self.path(), self._repo.wjoin(fctx.path()))
3103 3103 return self.data() != fctx.data()
3104 3104
3105 3105 def path(self):
3106 3106 return self._path
3107 3107
3108 3108 def flags(self):
3109 3109 return b''
3110 3110
3111 3111 def data(self):
3112 3112 return util.readfile(self._path)
3113 3113
3114 3114 def decodeddata(self):
3115 3115 with open(self._path, b"rb") as f:
3116 3116 return f.read()
3117 3117
3118 3118 def remove(self):
3119 3119 util.unlink(self._path)
3120 3120
3121 3121 def write(self, data, flags, **kwargs):
3122 3122 assert not flags
3123 3123 with open(self._path, b"wb") as f:
3124 3124 f.write(data)
@@ -1,1980 +1,1983 b''
1 1 # dirstate.py - working directory tracking for mercurial
2 2 #
3 3 # Copyright 2005-2007 Olivia Mackall <olivia@selenic.com>
4 4 #
5 5 # This software may be used and distributed according to the terms of the
6 6 # GNU General Public License version 2 or any later version.
7 7
8 8 from __future__ import absolute_import
9 9
10 10 import collections
11 11 import contextlib
12 12 import errno
13 13 import os
14 14 import stat
15 15
16 16 from .i18n import _
17 17 from .pycompat import delattr
18 18
19 19 from hgdemandimport import tracing
20 20
21 21 from . import (
22 22 encoding,
23 23 error,
24 24 match as matchmod,
25 25 pathutil,
26 26 policy,
27 27 pycompat,
28 28 scmutil,
29 29 sparse,
30 30 txnutil,
31 31 util,
32 32 )
33 33
34 34 from .interfaces import (
35 35 dirstate as intdirstate,
36 36 util as interfaceutil,
37 37 )
38 38
39 39 parsers = policy.importmod('parsers')
40 40 rustmod = policy.importrust('dirstate')
41 41
42 42 SUPPORTS_DIRSTATE_V2 = rustmod is not None
43 43
44 44 propertycache = util.propertycache
45 45 filecache = scmutil.filecache
46 46 _rangemask = 0x7FFFFFFF
47 47
48 48 dirstatetuple = parsers.dirstatetuple
49 49
50 50
51 51 class repocache(filecache):
52 52 """filecache for files in .hg/"""
53 53
54 54 def join(self, obj, fname):
55 55 return obj._opener.join(fname)
56 56
57 57
58 58 class rootcache(filecache):
59 59 """filecache for files in the repository root"""
60 60
61 61 def join(self, obj, fname):
62 62 return obj._join(fname)
63 63
64 64
65 65 def _getfsnow(vfs):
66 66 '''Get "now" timestamp on filesystem'''
67 67 tmpfd, tmpname = vfs.mkstemp()
68 68 try:
69 69 return os.fstat(tmpfd)[stat.ST_MTIME]
70 70 finally:
71 71 os.close(tmpfd)
72 72 vfs.unlink(tmpname)
73 73
74 74
75 75 @interfaceutil.implementer(intdirstate.idirstate)
76 76 class dirstate(object):
77 77 def __init__(
78 78 self,
79 79 opener,
80 80 ui,
81 81 root,
82 82 validate,
83 83 sparsematchfn,
84 84 nodeconstants,
85 85 use_dirstate_v2,
86 86 ):
87 87 """Create a new dirstate object.
88 88
89 89 opener is an open()-like callable that can be used to open the
90 90 dirstate file; root is the root of the directory tracked by
91 91 the dirstate.
92 92 """
93 93 self._use_dirstate_v2 = use_dirstate_v2
94 94 self._nodeconstants = nodeconstants
95 95 self._opener = opener
96 96 self._validate = validate
97 97 self._root = root
98 98 self._sparsematchfn = sparsematchfn
99 99 # ntpath.join(root, '') of Python 2.7.9 does not add sep if root is
100 100 # a UNC path pointing to a root share (issue4557)
101 101 self._rootdir = pathutil.normasprefix(root)
102 102 self._dirty = False
103 103 self._lastnormaltime = 0
104 104 self._ui = ui
105 105 self._filecache = {}
106 106 self._parentwriters = 0
107 107 self._filename = b'dirstate'
108 108 self._pendingfilename = b'%s.pending' % self._filename
109 109 self._plchangecallbacks = {}
110 110 self._origpl = None
111 111 self._updatedfiles = set()
112 112 self._mapcls = dirstatemap
113 113 # Access and cache cwd early, so we don't access it for the first time
114 114 # after a working-copy update caused it to not exist (accessing it then
115 115 # raises an exception).
116 116 self._cwd
117 117
118 118 def prefetch_parents(self):
119 119 """make sure the parents are loaded
120 120
121 121 Used to avoid a race condition.
122 122 """
123 123 self._pl
124 124
125 125 @contextlib.contextmanager
126 126 def parentchange(self):
127 127 """Context manager for handling dirstate parents.
128 128
129 129 If an exception occurs in the scope of the context manager,
130 130 the incoherent dirstate won't be written when wlock is
131 131 released.
132 132 """
133 133 self._parentwriters += 1
134 134 yield
135 135 # Typically we want the "undo" step of a context manager in a
136 136 # finally block so it happens even when an exception
137 137 # occurs. In this case, however, we only want to decrement
138 138 # parentwriters if the code in the with statement exits
139 139 # normally, so we don't have a try/finally here on purpose.
140 140 self._parentwriters -= 1
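
# Typical use (illustrative):
#
#   with repo.dirstate.parentchange():
#       repo.dirstate.setparents(newnode)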
141 141
142 142 def pendingparentchange(self):
143 143 """Returns true if the dirstate is in the middle of a set of changes
144 144 that modify the dirstate parent.
145 145 """
146 146 return self._parentwriters > 0
147 147
148 148 @propertycache
149 149 def _map(self):
150 150 """Return the dirstate contents (see documentation for dirstatemap)."""
151 151 self._map = self._mapcls(
152 152 self._ui,
153 153 self._opener,
154 154 self._root,
155 155 self._nodeconstants,
156 156 self._use_dirstate_v2,
157 157 )
158 158 return self._map
159 159
160 160 @property
161 161 def _sparsematcher(self):
162 162 """The matcher for the sparse checkout.
163 163
164 164 The working directory may not include every file from a manifest. The
165 165 matcher obtained by this property will match a path if it is to be
166 166 included in the working directory.
167 167 """
168 168 # TODO there is potential to cache this property. For now, the matcher
169 169 # is resolved on every access. (But the called function does use a
170 170 # cache to keep the lookup fast.)
171 171 return self._sparsematchfn()
172 172
173 173 @repocache(b'branch')
174 174 def _branch(self):
175 175 try:
176 176 return self._opener.read(b"branch").strip() or b"default"
177 177 except IOError as inst:
178 178 if inst.errno != errno.ENOENT:
179 179 raise
180 180 return b"default"
181 181
182 182 @property
183 183 def _pl(self):
184 184 return self._map.parents()
185 185
186 186 def hasdir(self, d):
187 187 return self._map.hastrackeddir(d)
188 188
189 189 @rootcache(b'.hgignore')
190 190 def _ignore(self):
191 191 files = self._ignorefiles()
192 192 if not files:
193 193 return matchmod.never()
194 194
195 195 pats = [b'include:%s' % f for f in files]
196 196 return matchmod.match(self._root, b'', [], pats, warn=self._ui.warn)
197 197
198 198 @propertycache
199 199 def _slash(self):
200 200 return self._ui.configbool(b'ui', b'slash') and pycompat.ossep != b'/'
201 201
202 202 @propertycache
203 203 def _checklink(self):
204 204 return util.checklink(self._root)
205 205
206 206 @propertycache
207 207 def _checkexec(self):
208 208 return bool(util.checkexec(self._root))
209 209
210 210 @propertycache
211 211 def _checkcase(self):
212 212 return not util.fscasesensitive(self._join(b'.hg'))
213 213
214 214 def _join(self, f):
215 215 # much faster than os.path.join()
216 216 # it's safe because f is always a relative path
217 217 return self._rootdir + f
218 218
219 219 def flagfunc(self, buildfallback):
220 220 if self._checklink and self._checkexec:
221 221
222 222 def f(x):
223 223 try:
224 224 st = os.lstat(self._join(x))
225 225 if util.statislink(st):
226 226 return b'l'
227 227 if util.statisexec(st):
228 228 return b'x'
229 229 except OSError:
230 230 pass
231 231 return b''
232 232
233 233 return f
234 234
235 235 fallback = buildfallback()
236 236 if self._checklink:
237 237
238 238 def f(x):
239 239 if os.path.islink(self._join(x)):
240 240 return b'l'
241 241 if b'x' in fallback(x):
242 242 return b'x'
243 243 return b''
244 244
245 245 return f
246 246 if self._checkexec:
247 247
248 248 def f(x):
249 249 if b'l' in fallback(x):
250 250 return b'l'
251 251 if util.isexec(self._join(x)):
252 252 return b'x'
253 253 return b''
254 254
255 255 return f
256 256 else:
257 257 return fallback
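
# e.g. on a filesystem supporting neither symlinks nor the exec bit
# (such as FAT), both checks fail and the flags come entirely from the
# fallback built out of manifest data rather than from disk.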
258 258
259 259 @propertycache
260 260 def _cwd(self):
261 261 # internal config: ui.forcecwd
262 262 forcecwd = self._ui.config(b'ui', b'forcecwd')
263 263 if forcecwd:
264 264 return forcecwd
265 265 return encoding.getcwd()
266 266
267 267 def getcwd(self):
268 268 """Return the path from which a canonical path is calculated.
269 269
270 270 This path should be used to resolve file patterns or to convert
271 271 canonical paths back to file paths for display. It shouldn't be
272 272 used to get real file paths. Use vfs functions instead.
273 273 """
274 274 cwd = self._cwd
275 275 if cwd == self._root:
276 276 return b''
277 277 # self._root ends with a path separator if self._root is '/' or 'C:\'
278 278 rootsep = self._root
279 279 if not util.endswithsep(rootsep):
280 280 rootsep += pycompat.ossep
281 281 if cwd.startswith(rootsep):
282 282 return cwd[len(rootsep) :]
283 283 else:
284 284 # we're outside the repo. return an absolute path.
285 285 return cwd
286 286
287 287 def pathto(self, f, cwd=None):
288 288 if cwd is None:
289 289 cwd = self.getcwd()
290 290 path = util.pathto(self._root, cwd, f)
291 291 if self._slash:
292 292 return util.pconvert(path)
293 293 return path
294 294
295 295 def __getitem__(self, key):
296 296 """Return the current state of key (a filename) in the dirstate.
297 297
298 298 States are:
299 299 n normal
300 300 m needs merging
301 301 r marked for removal
302 302 a marked for addition
303 303 ? not tracked
304 304 """
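        # Illustrative lookups (hypothetical filenames):
        #   dirstate[b'README']    -> b'n'  (clean tracked file)
        #   dirstate[b'newfile']   -> b'a'  (marked for addition)
        #   dirstate[b'untracked'] -> b'?'  (unknown to the dirstate)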
305 305 return self._map.get(key, (b"?",))[0]
306 306
307 307 def __contains__(self, key):
308 308 return key in self._map
309 309
310 310 def __iter__(self):
311 311 return iter(sorted(self._map))
312 312
313 313 def items(self):
314 314 return pycompat.iteritems(self._map)
315 315
316 316 iteritems = items
317 317
318 318 def parents(self):
319 319 return [self._validate(p) for p in self._pl]
320 320
321 321 def p1(self):
322 322 return self._validate(self._pl[0])
323 323
324 324 def p2(self):
325 325 return self._validate(self._pl[1])
326 326
327 327 def branch(self):
328 328 return encoding.tolocal(self._branch)
329 329
330 330 def setparents(self, p1, p2=None):
331 331 """Set dirstate parents to p1 and p2.
332 332
333 333         When moving from two parents to one, 'm' merged entries are
334 334         adjusted to normal, and previous copy records are discarded and
335 335         returned by the call.
336 336
337 337 See localrepo.setparents()
338 338 """
339 339 if p2 is None:
340 340 p2 = self._nodeconstants.nullid
341 341 if self._parentwriters == 0:
342 342 raise ValueError(
343 343 b"cannot set dirstate parent outside of "
344 344 b"dirstate.parentchange context manager"
345 345 )
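        # A sketch of the expected calling convention (using the context
        # manager named by the error message above):
        #   with dirstate.parentchange():
        #       dirstate.setparents(new_p1)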
346 346
347 347 self._dirty = True
348 348 oldp2 = self._pl[1]
349 349 if self._origpl is None:
350 350 self._origpl = self._pl
351 351 self._map.setparents(p1, p2)
352 352 copies = {}
353 353 if (
354 354 oldp2 != self._nodeconstants.nullid
355 355 and p2 == self._nodeconstants.nullid
356 356 ):
357 357 candidatefiles = self._map.non_normal_or_other_parent_paths()
358 358
359 359 for f in candidatefiles:
360 360 s = self._map.get(f)
361 361 if s is None:
362 362 continue
363 363
364 364 # Discard 'm' markers when moving away from a merge state
365 365 if s[0] == b'm':
366 366 source = self._map.copymap.get(f)
367 367 if source:
368 368 copies[f] = source
369 369 self.normallookup(f)
370 370 # Also fix up otherparent markers
371 371 elif s[0] == b'n' and s[2] == -2:
372 372 source = self._map.copymap.get(f)
373 373 if source:
374 374 copies[f] = source
375 375 self.add(f)
376 376 return copies
377 377
378 378 def setbranch(self, branch):
379 379 self.__class__._branch.set(self, encoding.fromlocal(branch))
380 380 f = self._opener(b'branch', b'w', atomictemp=True, checkambig=True)
381 381 try:
382 382 f.write(self._branch + b'\n')
383 383 f.close()
384 384
385 385 # make sure filecache has the correct stat info for _branch after
386 386 # replacing the underlying file
387 387 ce = self._filecache[b'_branch']
388 388 if ce:
389 389 ce.refresh()
390 390 except: # re-raises
391 391 f.discard()
392 392 raise
393 393
394 394 def invalidate(self):
395 395 """Causes the next access to reread the dirstate.
396 396
397 397 This is different from localrepo.invalidatedirstate() because it always
398 398 rereads the dirstate. Use localrepo.invalidatedirstate() if you want to
399 399 check whether the dirstate has changed before rereading it."""
400 400
401 401 for a in ("_map", "_branch", "_ignore"):
402 402 if a in self.__dict__:
403 403 delattr(self, a)
404 404 self._lastnormaltime = 0
405 405 self._dirty = False
406 406 self._updatedfiles.clear()
407 407 self._parentwriters = 0
408 408 self._origpl = None
409 409
410 410 def copy(self, source, dest):
411 411 """Mark dest as a copy of source. Unmark dest if source is None."""
412 412 if source == dest:
413 413 return
414 414 self._dirty = True
415 415 if source is not None:
416 416 self._map.copymap[dest] = source
417 417 self._updatedfiles.add(source)
418 418 self._updatedfiles.add(dest)
419 419 elif self._map.copymap.pop(dest, None):
420 420 self._updatedfiles.add(dest)
421 421
422 422 def copied(self, file):
423 423 return self._map.copymap.get(file, None)
424 424
425 425 def copies(self):
426 426 return self._map.copymap
427 427
428 428 def _addpath(self, f, state, mode, size, mtime):
429 429 oldstate = self[f]
430 430 if state == b'a' or oldstate == b'r':
431 431 scmutil.checkfilename(f)
432 432 if self._map.hastrackeddir(f):
433 433 raise error.Abort(
434 434 _(b'directory %r already in dirstate') % pycompat.bytestr(f)
435 435 )
436 436 # shadows
437 437 for d in pathutil.finddirs(f):
438 438 if self._map.hastrackeddir(d):
439 439 break
440 440 entry = self._map.get(d)
441 441 if entry is not None and entry[0] != b'r':
442 442 raise error.Abort(
443 443 _(b'file %r in dirstate clashes with %r')
444 444 % (pycompat.bytestr(d), pycompat.bytestr(f))
445 445 )
446 446 self._dirty = True
447 447 self._updatedfiles.add(f)
448 448 self._map.addfile(f, oldstate, state, mode, size, mtime)
449 449
450 450 def normal(self, f, parentfiledata=None):
451 451 """Mark a file normal and clean.
452 452
453 453 parentfiledata: (mode, size, mtime) of the clean file
454 454
455 455         parentfiledata should be computed from memory (for mode and
456 456         size), at or as close as possible to the point where we
457 457 determined the file was clean, to limit the risk of the
458 458 file having been changed by an external process between the
459 459 moment where the file was determined to be clean and now."""
460 460 if parentfiledata:
461 461 (mode, size, mtime) = parentfiledata
462 462 else:
463 463 s = os.lstat(self._join(f))
464 464 mode = s.st_mode
465 465 size = s.st_size
466 466 mtime = s[stat.ST_MTIME]
467 467 self._addpath(f, b'n', mode, size & _rangemask, mtime & _rangemask)
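        # (size and mtime above are masked to their low 31 bits so they fit
        # the dirstate's fixed-width fields; _rangemask is assumed to be
        # 0x7FFFFFFF, as defined elsewhere in this module.)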
468 468 self._map.copymap.pop(f, None)
469 469 if f in self._map.nonnormalset:
470 470 self._map.nonnormalset.remove(f)
471 471 if mtime > self._lastnormaltime:
472 472 # Remember the most recent modification timeslot for status(),
473 473 # to make sure we won't miss future size-preserving file content
474 474 # modifications that happen within the same timeslot.
475 475 self._lastnormaltime = mtime
476 476
477 477 def normallookup(self, f):
478 478 '''Mark a file normal, but possibly dirty.'''
479 479 if self._pl[1] != self._nodeconstants.nullid:
480 480 # if there is a merge going on and the file was either
481 481 # in state 'm' (-1) or coming from other parent (-2) before
482 482 # being removed, restore that state.
483 483 entry = self._map.get(f)
484 484 if entry is not None:
485 485 if entry[0] == b'r' and entry[2] in (-1, -2):
486 486 source = self._map.copymap.get(f)
487 487 if entry[2] == -1:
488 488 self.merge(f)
489 489 elif entry[2] == -2:
490 490 self.otherparent(f)
491 491 if source:
492 492 self.copy(source, f)
493 493 return
494 494 if entry[0] == b'm' or entry[0] == b'n' and entry[2] == -2:
495 495 return
496 496 self._addpath(f, b'n', 0, -1, -1)
497 497 self._map.copymap.pop(f, None)
498 498
499 499 def otherparent(self, f):
500 500 '''Mark as coming from the other parent, always dirty.'''
501 501 if self._pl[1] == self._nodeconstants.nullid:
502 502 raise error.Abort(
503 503 _(b"setting %r to other parent only allowed in merges") % f
504 504 )
505 505 if f in self and self[f] == b'n':
506 506 # merge-like
507 507 self._addpath(f, b'm', 0, -2, -1)
508 508 else:
509 509 # add-like
510 510 self._addpath(f, b'n', 0, -2, -1)
511 511 self._map.copymap.pop(f, None)
512 512
513 513 def add(self, f):
514 514 '''Mark a file added.'''
515 515 self._addpath(f, b'a', 0, -1, -1)
516 516 self._map.copymap.pop(f, None)
517 517
518 518 def remove(self, f):
519 519 '''Mark a file removed.'''
520 520 self._dirty = True
521 521 oldstate = self[f]
522 522 size = 0
523 523 if self._pl[1] != self._nodeconstants.nullid:
524 524 entry = self._map.get(f)
525 525 if entry is not None:
526 526 # backup the previous state
527 527 if entry[0] == b'm': # merge
528 528 size = -1
529 529 elif entry[0] == b'n' and entry[2] == -2: # other parent
530 530 size = -2
531 531 self._map.otherparentset.add(f)
532 532 self._updatedfiles.add(f)
533 533 self._map.removefile(f, oldstate, size)
534 534 if size == 0:
535 535 self._map.copymap.pop(f, None)
536 536
537 537 def merge(self, f):
538 538 '''Mark a file merged.'''
539 539 if self._pl[1] == self._nodeconstants.nullid:
540 540 return self.normallookup(f)
541 541 return self.otherparent(f)
542 542
543 543 def drop(self, f):
544 544 '''Drop a file from the dirstate'''
545 545 oldstate = self[f]
546 546 if self._map.dropfile(f, oldstate):
547 547 self._dirty = True
548 548 self._updatedfiles.add(f)
549 549 self._map.copymap.pop(f, None)
550 550
551 551 def _discoverpath(self, path, normed, ignoremissing, exists, storemap):
552 552 if exists is None:
553 553 exists = os.path.lexists(os.path.join(self._root, path))
554 554 if not exists:
555 555 # Maybe a path component exists
556 556 if not ignoremissing and b'/' in path:
557 557 d, f = path.rsplit(b'/', 1)
558 558 d = self._normalize(d, False, ignoremissing, None)
559 559 folded = d + b"/" + f
560 560 else:
561 561 # No path components, preserve original case
562 562 folded = path
563 563 else:
564 564 # recursively normalize leading directory components
565 565 # against dirstate
566 566 if b'/' in normed:
567 567 d, f = normed.rsplit(b'/', 1)
568 568 d = self._normalize(d, False, ignoremissing, True)
569 569 r = self._root + b"/" + d
570 570 folded = d + b"/" + util.fspath(f, r)
571 571 else:
572 572 folded = util.fspath(normed, self._root)
573 573 storemap[normed] = folded
574 574
575 575 return folded
576 576
577 577 def _normalizefile(self, path, isknown, ignoremissing=False, exists=None):
578 578 normed = util.normcase(path)
579 579 folded = self._map.filefoldmap.get(normed, None)
580 580 if folded is None:
581 581 if isknown:
582 582 folded = path
583 583 else:
584 584 folded = self._discoverpath(
585 585 path, normed, ignoremissing, exists, self._map.filefoldmap
586 586 )
587 587 return folded
588 588
589 589 def _normalize(self, path, isknown, ignoremissing=False, exists=None):
590 590 normed = util.normcase(path)
591 591 folded = self._map.filefoldmap.get(normed, None)
592 592 if folded is None:
593 593 folded = self._map.dirfoldmap.get(normed, None)
594 594 if folded is None:
595 595 if isknown:
596 596 folded = path
597 597 else:
598 598 # store discovered result in dirfoldmap so that future
599 599 # normalizefile calls don't start matching directories
600 600 folded = self._discoverpath(
601 601 path, normed, ignoremissing, exists, self._map.dirfoldmap
602 602 )
603 603 return folded
604 604
605 605 def normalize(self, path, isknown=False, ignoremissing=False):
606 606 """
607 607 normalize the case of a pathname when on a casefolding filesystem
608 608
609 609 isknown specifies whether the filename came from walking the
610 610 disk, to avoid extra filesystem access.
611 611
612 612         If ignoremissing is True, missing paths are returned
613 613 unchanged. Otherwise, we try harder to normalize possibly
614 614 existing path components.
615 615
616 616 The normalized case is determined based on the following precedence:
617 617
618 618 - version of name already stored in the dirstate
619 619 - version of name stored on disk
620 620 - version provided via command arguments
621 621 """
622 622
623 623 if self._checkcase:
624 624 return self._normalize(path, isknown, ignoremissing)
625 625 return path
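        # Illustrative behavior (hypothetical names): on a case-insensitive
        # filesystem where the dirstate already tracks b'Makefile',
        #   normalize(b'MAKEFILE') -> b'Makefile'
        # while on a case-sensitive filesystem the path is returned unchanged.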
626 626
627 627 def clear(self):
628 628 self._map.clear()
629 629 self._lastnormaltime = 0
630 630 self._updatedfiles.clear()
631 631 self._dirty = True
632 632
633 633 def rebuild(self, parent, allfiles, changedfiles=None):
634 634 if changedfiles is None:
635 635 # Rebuild entire dirstate
636 636 to_lookup = allfiles
637 637 to_drop = []
638 638 lastnormaltime = self._lastnormaltime
639 639 self.clear()
640 640 self._lastnormaltime = lastnormaltime
641 641 elif len(changedfiles) < 10:
642 642 # Avoid turning allfiles into a set, which can be expensive if it's
643 643 # large.
644 644 to_lookup = []
645 645 to_drop = []
646 646 for f in changedfiles:
647 647 if f in allfiles:
648 648 to_lookup.append(f)
649 649 else:
650 650 to_drop.append(f)
651 651 else:
652 652 changedfilesset = set(changedfiles)
653 653 to_lookup = changedfilesset & set(allfiles)
654 654 to_drop = changedfilesset - to_lookup
655 655
656 656 if self._origpl is None:
657 657 self._origpl = self._pl
658 658 self._map.setparents(parent, self._nodeconstants.nullid)
659 659
660 660 for f in to_lookup:
661 661 self.normallookup(f)
662 662 for f in to_drop:
663 663 self.drop(f)
664 664
665 665 self._dirty = True
666 666
667 667 def identity(self):
668 668         """Return the identity of the dirstate itself, to detect storage changes
669 669
670 670         If the identity of a previous dirstate equals this one, writing out
671 671         changes based on that former dirstate can preserve consistency.
672 672 """
673 673 return self._map.identity
674 674
675 675 def write(self, tr):
676 676 if not self._dirty:
677 677 return
678 678
679 679 filename = self._filename
680 680 if tr:
681 681 # 'dirstate.write()' is not only for writing in-memory
682 682             # changes out, but also for dropping ambiguous timestamps.
683 683             # delayed writing would re-raise the "ambiguous timestamp issue".
684 684 # See also the wiki page below for detail:
685 685 # https://www.mercurial-scm.org/wiki/DirstateTransactionPlan
686 686
687 687 # emulate dropping timestamp in 'parsers.pack_dirstate'
688 688 now = _getfsnow(self._opener)
689 689 self._map.clearambiguoustimes(self._updatedfiles, now)
690 690
691 691 # emulate that all 'dirstate.normal' results are written out
692 692 self._lastnormaltime = 0
693 693 self._updatedfiles.clear()
694 694
695 695 # delay writing in-memory changes out
696 696 tr.addfilegenerator(
697 697 b'dirstate',
698 698 (self._filename,),
699 699 self._writedirstate,
700 700 location=b'plain',
701 701 )
702 702 return
703 703
704 704 st = self._opener(filename, b"w", atomictemp=True, checkambig=True)
705 705 self._writedirstate(st)
706 706
707 707 def addparentchangecallback(self, category, callback):
708 708 """add a callback to be called when the wd parents are changed
709 709
710 710 Callback will be called with the following arguments:
711 711 dirstate, (oldp1, oldp2), (newp1, newp2)
712 712
713 713 Category is a unique identifier to allow overwriting an old callback
714 714 with a newer callback.
715 715 """
716 716 self._plchangecallbacks[category] = callback
717 717
718 718 def _writedirstate(self, st):
719 719 # notify callbacks about parents change
720 720 if self._origpl is not None and self._origpl != self._pl:
721 721 for c, callback in sorted(
722 722 pycompat.iteritems(self._plchangecallbacks)
723 723 ):
724 724 callback(self, self._origpl, self._pl)
725 725 self._origpl = None
726 726 # use the modification time of the newly created temporary file as the
727 727 # filesystem's notion of 'now'
728 728 now = util.fstat(st)[stat.ST_MTIME] & _rangemask
729 729
730 730         # a large enough 'delaywrite' prevents 'pack_dirstate' from dropping
731 731         # the timestamp of dirstate entries, by ensuring 'now > mtime' holds
732 732 delaywrite = self._ui.configint(b'debug', b'dirstate.delaywrite')
733 733 if delaywrite > 0:
734 734 # do we have any files to delay for?
735 735 for f, e in pycompat.iteritems(self._map):
736 736 if e[0] == b'n' and e[3] == now:
737 737 import time # to avoid useless import
738 738
739 739 # rather than sleep n seconds, sleep until the next
740 740 # multiple of n seconds
741 741 clock = time.time()
742 742 start = int(clock) - (int(clock) % delaywrite)
743 743 end = start + delaywrite
744 744 time.sleep(end - clock)
745 745 now = end # trust our estimate that the end is near now
746 746 break
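                # Worked example of the arithmetic above: with delaywrite=2
                # and clock=103.4, start=102 and end=104, so we sleep 0.6s and
                # then treat 104 (the next multiple-of-2 boundary) as "now".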
747 747
748 748 self._map.write(st, now)
749 749 self._lastnormaltime = 0
750 750 self._dirty = False
751 751
752 752 def _dirignore(self, f):
753 753 if self._ignore(f):
754 754 return True
755 755 for p in pathutil.finddirs(f):
756 756 if self._ignore(p):
757 757 return True
758 758 return False
759 759
760 760 def _ignorefiles(self):
761 761 files = []
762 762 if os.path.exists(self._join(b'.hgignore')):
763 763 files.append(self._join(b'.hgignore'))
764 764 for name, path in self._ui.configitems(b"ui"):
765 765 if name == b'ignore' or name.startswith(b'ignore.'):
766 766 # we need to use os.path.join here rather than self._join
767 767 # because path is arbitrary and user-specified
768 768 files.append(os.path.join(self._rootdir, util.expandpath(path)))
769 769 return files
770 770
771 771 def _ignorefileandline(self, f):
772 772 files = collections.deque(self._ignorefiles())
773 773 visited = set()
774 774 while files:
775 775 i = files.popleft()
776 776 patterns = matchmod.readpatternfile(
777 777 i, self._ui.warn, sourceinfo=True
778 778 )
779 779 for pattern, lineno, line in patterns:
780 780 kind, p = matchmod._patsplit(pattern, b'glob')
781 781 if kind == b"subinclude":
782 782 if p not in visited:
783 783 files.append(p)
784 784 continue
785 785 m = matchmod.match(
786 786 self._root, b'', [], [pattern], warn=self._ui.warn
787 787 )
788 788 if m(f):
789 789 return (i, lineno, line)
790 790 visited.add(i)
791 791 return (None, -1, b"")
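        # Illustrative result (hypothetical repo): if b'build/out.o' is
        # ignored by line 3 of the root .hgignore, this returns something
        # like (b'.../.hgignore', 3, b'*.o'); an unignored file yields the
        # (None, -1, b"") sentinel above.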
792 792
793 793 def _walkexplicit(self, match, subrepos):
794 794 """Get stat data about the files explicitly specified by match.
795 795
796 796 Return a triple (results, dirsfound, dirsnotfound).
797 797 - results is a mapping from filename to stat result. It also contains
798 798 listings mapping subrepos and .hg to None.
799 799 - dirsfound is a list of files found to be directories.
800 800 - dirsnotfound is a list of files that the dirstate thinks are
801 801 directories and that were not found."""
802 802
803 803 def badtype(mode):
804 804 kind = _(b'unknown')
805 805 if stat.S_ISCHR(mode):
806 806 kind = _(b'character device')
807 807 elif stat.S_ISBLK(mode):
808 808 kind = _(b'block device')
809 809 elif stat.S_ISFIFO(mode):
810 810 kind = _(b'fifo')
811 811 elif stat.S_ISSOCK(mode):
812 812 kind = _(b'socket')
813 813 elif stat.S_ISDIR(mode):
814 814 kind = _(b'directory')
815 815 return _(b'unsupported file type (type is %s)') % kind
816 816
817 817 badfn = match.bad
818 818 dmap = self._map
819 819 lstat = os.lstat
820 820 getkind = stat.S_IFMT
821 821 dirkind = stat.S_IFDIR
822 822 regkind = stat.S_IFREG
823 823 lnkkind = stat.S_IFLNK
824 824 join = self._join
825 825 dirsfound = []
826 826 foundadd = dirsfound.append
827 827 dirsnotfound = []
828 828 notfoundadd = dirsnotfound.append
829 829
830 830 if not match.isexact() and self._checkcase:
831 831 normalize = self._normalize
832 832 else:
833 833 normalize = None
834 834
835 835 files = sorted(match.files())
836 836 subrepos.sort()
837 837 i, j = 0, 0
838 838 while i < len(files) and j < len(subrepos):
839 839 subpath = subrepos[j] + b"/"
840 840 if files[i] < subpath:
841 841 i += 1
842 842 continue
843 843 while i < len(files) and files[i].startswith(subpath):
844 844 del files[i]
845 845 j += 1
846 846
847 847 if not files or b'' in files:
848 848 files = [b'']
849 849 # constructing the foldmap is expensive, so don't do it for the
850 850 # common case where files is ['']
851 851 normalize = None
852 852 results = dict.fromkeys(subrepos)
853 853 results[b'.hg'] = None
854 854
855 855 for ff in files:
856 856 if normalize:
857 857 nf = normalize(ff, False, True)
858 858 else:
859 859 nf = ff
860 860 if nf in results:
861 861 continue
862 862
863 863 try:
864 864 st = lstat(join(nf))
865 865 kind = getkind(st.st_mode)
866 866 if kind == dirkind:
867 867 if nf in dmap:
868 868 # file replaced by dir on disk but still in dirstate
869 869 results[nf] = None
870 870 foundadd((nf, ff))
871 871 elif kind == regkind or kind == lnkkind:
872 872 results[nf] = st
873 873 else:
874 874 badfn(ff, badtype(kind))
875 875 if nf in dmap:
876 876 results[nf] = None
877 877 except OSError as inst: # nf not found on disk - it is dirstate only
878 878 if nf in dmap: # does it exactly match a missing file?
879 879 results[nf] = None
880 880 else: # does it match a missing directory?
881 881 if self._map.hasdir(nf):
882 882 notfoundadd(nf)
883 883 else:
884 884 badfn(ff, encoding.strtolocal(inst.strerror))
885 885
886 886 # match.files() may contain explicitly-specified paths that shouldn't
887 887 # be taken; drop them from the list of files found. dirsfound/notfound
888 888 # aren't filtered here because they will be tested later.
889 889 if match.anypats():
890 890 for f in list(results):
891 891 if f == b'.hg' or f in subrepos:
892 892 # keep sentinel to disable further out-of-repo walks
893 893 continue
894 894 if not match(f):
895 895 del results[f]
896 896
897 897 # Case insensitive filesystems cannot rely on lstat() failing to detect
898 898 # a case-only rename. Prune the stat object for any file that does not
899 899 # match the case in the filesystem, if there are multiple files that
900 900 # normalize to the same path.
901 901 if match.isexact() and self._checkcase:
902 902 normed = {}
903 903
904 904 for f, st in pycompat.iteritems(results):
905 905 if st is None:
906 906 continue
907 907
908 908 nc = util.normcase(f)
909 909 paths = normed.get(nc)
910 910
911 911 if paths is None:
912 912 paths = set()
913 913 normed[nc] = paths
914 914
915 915 paths.add(f)
916 916
917 917 for norm, paths in pycompat.iteritems(normed):
918 918 if len(paths) > 1:
919 919 for path in paths:
920 920 folded = self._discoverpath(
921 921 path, norm, True, None, self._map.dirfoldmap
922 922 )
923 923 if path != folded:
924 924 results[path] = None
925 925
926 926 return results, dirsfound, dirsnotfound
927 927
928 928 def walk(self, match, subrepos, unknown, ignored, full=True):
929 929 """
930 930 Walk recursively through the directory tree, finding all files
931 931 matched by match.
932 932
933 933 If full is False, maybe skip some known-clean files.
934 934
935 935 Return a dict mapping filename to stat-like object (either
936 936 mercurial.osutil.stat instance or return value of os.stat()).
937 937
938 938 """
939 939 # full is a flag that extensions that hook into walk can use -- this
940 940 # implementation doesn't use it at all. This satisfies the contract
941 941 # because we only guarantee a "maybe".
942 942
943 943 if ignored:
944 944 ignore = util.never
945 945 dirignore = util.never
946 946 elif unknown:
947 947 ignore = self._ignore
948 948 dirignore = self._dirignore
949 949 else:
950 950 # if not unknown and not ignored, drop dir recursion and step 2
951 951 ignore = util.always
952 952 dirignore = util.always
953 953
954 954 matchfn = match.matchfn
955 955 matchalways = match.always()
956 956 matchtdir = match.traversedir
957 957 dmap = self._map
958 958 listdir = util.listdir
959 959 lstat = os.lstat
960 960 dirkind = stat.S_IFDIR
961 961 regkind = stat.S_IFREG
962 962 lnkkind = stat.S_IFLNK
963 963 join = self._join
964 964
965 965 exact = skipstep3 = False
966 966 if match.isexact(): # match.exact
967 967 exact = True
968 968 dirignore = util.always # skip step 2
969 969 elif match.prefix(): # match.match, no patterns
970 970 skipstep3 = True
971 971
972 972 if not exact and self._checkcase:
973 973 normalize = self._normalize
974 974 normalizefile = self._normalizefile
975 975 skipstep3 = False
976 976 else:
977 977 normalize = self._normalize
978 978 normalizefile = None
979 979
980 980 # step 1: find all explicit files
981 981 results, work, dirsnotfound = self._walkexplicit(match, subrepos)
982 982 if matchtdir:
983 983 for d in work:
984 984 matchtdir(d[0])
985 985 for d in dirsnotfound:
986 986 matchtdir(d)
987 987
988 988 skipstep3 = skipstep3 and not (work or dirsnotfound)
989 989 work = [d for d in work if not dirignore(d[0])]
990 990
991 991 # step 2: visit subdirectories
992 992 def traverse(work, alreadynormed):
993 993 wadd = work.append
994 994 while work:
995 995 tracing.counter('dirstate.walk work', len(work))
996 996 nd = work.pop()
997 997 visitentries = match.visitchildrenset(nd)
998 998 if not visitentries:
999 999 continue
1000 1000 if visitentries == b'this' or visitentries == b'all':
1001 1001 visitentries = None
1002 1002 skip = None
1003 1003 if nd != b'':
1004 1004 skip = b'.hg'
1005 1005 try:
1006 1006 with tracing.log('dirstate.walk.traverse listdir %s', nd):
1007 1007 entries = listdir(join(nd), stat=True, skip=skip)
1008 1008 except OSError as inst:
1009 1009 if inst.errno in (errno.EACCES, errno.ENOENT):
1010 1010 match.bad(
1011 1011 self.pathto(nd), encoding.strtolocal(inst.strerror)
1012 1012 )
1013 1013 continue
1014 1014 raise
1015 1015 for f, kind, st in entries:
1016 1016 # Some matchers may return files in the visitentries set,
1017 1017 # instead of 'this', if the matcher explicitly mentions them
1018 1018 # and is not an exactmatcher. This is acceptable; we do not
1019 1019 # make any hard assumptions about file-or-directory below
1020 1020 # based on the presence of `f` in visitentries. If
1021 1021 # visitchildrenset returned a set, we can always skip the
1022 1022 # entries *not* in the set it provided regardless of whether
1023 1023 # they're actually a file or a directory.
1024 1024 if visitentries and f not in visitentries:
1025 1025 continue
1026 1026 if normalizefile:
1027 1027 # even though f might be a directory, we're only
1028 1028 # interested in comparing it to files currently in the
1029 1029 # dmap -- therefore normalizefile is enough
1030 1030 nf = normalizefile(
1031 1031 nd and (nd + b"/" + f) or f, True, True
1032 1032 )
1033 1033 else:
1034 1034 nf = nd and (nd + b"/" + f) or f
1035 1035 if nf not in results:
1036 1036 if kind == dirkind:
1037 1037 if not ignore(nf):
1038 1038 if matchtdir:
1039 1039 matchtdir(nf)
1040 1040 wadd(nf)
1041 1041 if nf in dmap and (matchalways or matchfn(nf)):
1042 1042 results[nf] = None
1043 1043 elif kind == regkind or kind == lnkkind:
1044 1044 if nf in dmap:
1045 1045 if matchalways or matchfn(nf):
1046 1046 results[nf] = st
1047 1047 elif (matchalways or matchfn(nf)) and not ignore(
1048 1048 nf
1049 1049 ):
1050 1050 # unknown file -- normalize if necessary
1051 1051 if not alreadynormed:
1052 1052 nf = normalize(nf, False, True)
1053 1053 results[nf] = st
1054 1054 elif nf in dmap and (matchalways or matchfn(nf)):
1055 1055 results[nf] = None
1056 1056
1057 1057 for nd, d in work:
1058 1058 # alreadynormed means that processwork doesn't have to do any
1059 1059 # expensive directory normalization
1060 1060 alreadynormed = not normalize or nd == d
1061 1061 traverse([d], alreadynormed)
1062 1062
1063 1063 for s in subrepos:
1064 1064 del results[s]
1065 1065 del results[b'.hg']
1066 1066
1067 1067 # step 3: visit remaining files from dmap
1068 1068 if not skipstep3 and not exact:
1069 1069 # If a dmap file is not in results yet, it was either
1070 1070             # a) not matching matchfn, b) ignored, c) missing, or d) under a
1071 1071 # symlink directory.
1072 1072 if not results and matchalways:
1073 1073 visit = [f for f in dmap]
1074 1074 else:
1075 1075 visit = [f for f in dmap if f not in results and matchfn(f)]
1076 1076 visit.sort()
1077 1077
1078 1078 if unknown:
1079 1079 # unknown == True means we walked all dirs under the roots
1080 1080             # that weren't ignored, and everything that matched was stat'ed
1081 1081 # and is already in results.
1082 1082 # The rest must thus be ignored or under a symlink.
1083 1083 audit_path = pathutil.pathauditor(self._root, cached=True)
1084 1084
1085 1085 for nf in iter(visit):
1086 1086 # If a stat for the same file was already added with a
1087 1087 # different case, don't add one for this, since that would
1088 1088 # make it appear as if the file exists under both names
1089 1089 # on disk.
1090 1090 if (
1091 1091 normalizefile
1092 1092 and normalizefile(nf, True, True) in results
1093 1093 ):
1094 1094 results[nf] = None
1095 1095 # Report ignored items in the dmap as long as they are not
1096 1096 # under a symlink directory.
1097 1097 elif audit_path.check(nf):
1098 1098 try:
1099 1099 results[nf] = lstat(join(nf))
1100 1100 # file was just ignored, no links, and exists
1101 1101 except OSError:
1102 1102 # file doesn't exist
1103 1103 results[nf] = None
1104 1104 else:
1105 1105 # It's either missing or under a symlink directory
1106 1106 # which we in this case report as missing
1107 1107 results[nf] = None
1108 1108 else:
1109 1109 # We may not have walked the full directory tree above,
1110 1110 # so stat and check everything we missed.
1111 1111 iv = iter(visit)
1112 1112 for st in util.statfiles([join(i) for i in visit]):
1113 1113 results[next(iv)] = st
1114 1114 return results
1115 1115
1116 1116 def _rust_status(self, matcher, list_clean, list_ignored, list_unknown):
1117 1117 # Force Rayon (Rust parallelism library) to respect the number of
1118 1118 # workers. This is a temporary workaround until Rust code knows
1119 1119 # how to read the config file.
1120 1120 numcpus = self._ui.configint(b"worker", b"numcpus")
1121 1121 if numcpus is not None:
1122 1122 encoding.environ.setdefault(b'RAYON_NUM_THREADS', b'%d' % numcpus)
1123 1123
1124 1124 workers_enabled = self._ui.configbool(b"worker", b"enabled", True)
1125 1125 if not workers_enabled:
1126 1126 encoding.environ[b"RAYON_NUM_THREADS"] = b"1"
1127 1127
1128 1128 (
1129 1129 lookup,
1130 1130 modified,
1131 1131 added,
1132 1132 removed,
1133 1133 deleted,
1134 1134 clean,
1135 1135 ignored,
1136 1136 unknown,
1137 1137 warnings,
1138 1138 bad,
1139 1139 traversed,
1140 dirty,
1140 1141 ) = rustmod.status(
1141 1142 self._map._rustmap,
1142 1143 matcher,
1143 1144 self._rootdir,
1144 1145 self._ignorefiles(),
1145 1146 self._checkexec,
1146 1147 self._lastnormaltime,
1147 1148 bool(list_clean),
1148 1149 bool(list_ignored),
1149 1150 bool(list_unknown),
1150 1151 bool(matcher.traversedir),
1151 1152 )
1152 1153
1154 self._dirty |= dirty
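        # (The Rust status call can now report, via `dirty`, that it updated
        # its in-memory state as a side effect of the walk; folding that into
        # self._dirty makes the next write() persist those changes.)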
1155
1153 1156 if matcher.traversedir:
1154 1157 for dir in traversed:
1155 1158 matcher.traversedir(dir)
1156 1159
1157 1160 if self._ui.warn:
1158 1161 for item in warnings:
1159 1162 if isinstance(item, tuple):
1160 1163 file_path, syntax = item
1161 1164 msg = _(b"%s: ignoring invalid syntax '%s'\n") % (
1162 1165 file_path,
1163 1166 syntax,
1164 1167 )
1165 1168 self._ui.warn(msg)
1166 1169 else:
1167 1170 msg = _(b"skipping unreadable pattern file '%s': %s\n")
1168 1171 self._ui.warn(
1169 1172 msg
1170 1173 % (
1171 1174 pathutil.canonpath(
1172 1175 self._rootdir, self._rootdir, item
1173 1176 ),
1174 1177 b"No such file or directory",
1175 1178 )
1176 1179 )
1177 1180
1178 1181 for (fn, message) in bad:
1179 1182 matcher.bad(fn, encoding.strtolocal(message))
1180 1183
1181 1184 status = scmutil.status(
1182 1185 modified=modified,
1183 1186 added=added,
1184 1187 removed=removed,
1185 1188 deleted=deleted,
1186 1189 unknown=unknown,
1187 1190 ignored=ignored,
1188 1191 clean=clean,
1189 1192 )
1190 1193 return (lookup, status)
1191 1194
1192 1195 def status(self, match, subrepos, ignored, clean, unknown):
1193 1196 """Determine the status of the working copy relative to the
1194 1197 dirstate and return a pair of (unsure, status), where status is of type
1195 1198 scmutil.status and:
1196 1199
1197 1200 unsure:
1198 1201 files that might have been modified since the dirstate was
1199 1202 written, but need to be read to be sure (size is the same
1200 1203 but mtime differs)
1201 1204 status.modified:
1202 1205 files that have definitely been modified since the dirstate
1203 1206 was written (different size or mode)
1204 1207 status.clean:
1205 1208 files that have definitely not been modified since the
1206 1209 dirstate was written
1207 1210 """
1208 1211 listignored, listclean, listunknown = ignored, clean, unknown
1209 1212 lookup, modified, added, unknown, ignored = [], [], [], [], []
1210 1213 removed, deleted, clean = [], [], []
1211 1214
1212 1215 dmap = self._map
1213 1216 dmap.preload()
1214 1217
1215 1218 use_rust = True
1216 1219
1217 1220 allowed_matchers = (
1218 1221 matchmod.alwaysmatcher,
1219 1222 matchmod.exactmatcher,
1220 1223 matchmod.includematcher,
1221 1224 )
1222 1225
1223 1226 if rustmod is None:
1224 1227 use_rust = False
1225 1228 elif self._checkcase:
1226 1229 # Case-insensitive filesystems are not handled yet
1227 1230 use_rust = False
1228 1231 elif subrepos:
1229 1232 use_rust = False
1230 1233 elif sparse.enabled:
1231 1234 use_rust = False
1232 1235 elif not isinstance(match, allowed_matchers):
1233 1236 # Some matchers have yet to be implemented
1234 1237 use_rust = False
1235 1238
1236 1239 if use_rust:
1237 1240 try:
1238 1241 return self._rust_status(
1239 1242 match, listclean, listignored, listunknown
1240 1243 )
1241 1244 except rustmod.FallbackError:
1242 1245 pass
1243 1246
1244 1247 def noop(f):
1245 1248 pass
1246 1249
1247 1250 dcontains = dmap.__contains__
1248 1251 dget = dmap.__getitem__
1249 1252 ladd = lookup.append # aka "unsure"
1250 1253 madd = modified.append
1251 1254 aadd = added.append
1252 1255 uadd = unknown.append if listunknown else noop
1253 1256 iadd = ignored.append if listignored else noop
1254 1257 radd = removed.append
1255 1258 dadd = deleted.append
1256 1259 cadd = clean.append if listclean else noop
1257 1260 mexact = match.exact
1258 1261 dirignore = self._dirignore
1259 1262 checkexec = self._checkexec
1260 1263 copymap = self._map.copymap
1261 1264 lastnormaltime = self._lastnormaltime
1262 1265
1263 1266 # We need to do full walks when either
1264 1267 # - we're listing all clean files, or
1265 1268 # - match.traversedir does something, because match.traversedir should
1266 1269 # be called for every dir in the working dir
1267 1270 full = listclean or match.traversedir is not None
1268 1271 for fn, st in pycompat.iteritems(
1269 1272 self.walk(match, subrepos, listunknown, listignored, full=full)
1270 1273 ):
1271 1274 if not dcontains(fn):
1272 1275 if (listignored or mexact(fn)) and dirignore(fn):
1273 1276 if listignored:
1274 1277 iadd(fn)
1275 1278 else:
1276 1279 uadd(fn)
1277 1280 continue
1278 1281
1279 1282 # This is equivalent to 'state, mode, size, time = dmap[fn]' but not
1280 1283 # written like that for performance reasons. dmap[fn] is not a
1281 1284 # Python tuple in compiled builds. The CPython UNPACK_SEQUENCE
1282 1285 # opcode has fast paths when the value to be unpacked is a tuple or
1283 1286 # a list, but falls back to creating a full-fledged iterator in
1284 1287 # general. That is much slower than simply accessing and storing the
1285 1288 # tuple members one by one.
1286 1289 t = dget(fn)
1287 1290 state = t[0]
1288 1291 mode = t[1]
1289 1292 size = t[2]
1290 1293 time = t[3]
1291 1294
1292 1295 if not st and state in b"nma":
1293 1296 dadd(fn)
1294 1297 elif state == b'n':
1295 1298 if (
1296 1299 size >= 0
1297 1300 and (
1298 1301 (size != st.st_size and size != st.st_size & _rangemask)
1299 1302 or ((mode ^ st.st_mode) & 0o100 and checkexec)
1300 1303 )
1301 1304 or size == -2 # other parent
1302 1305 or fn in copymap
1303 1306 ):
1304 1307 if stat.S_ISLNK(st.st_mode) and size != st.st_size:
1305 1308                         # issue6456: the size returned may be longer due to
1306 1309                         # encryption on ext4 fscrypt; exact behavior undecided.
1307 1310 ladd(fn)
1308 1311 else:
1309 1312 madd(fn)
1310 1313 elif (
1311 1314 time != st[stat.ST_MTIME]
1312 1315 and time != st[stat.ST_MTIME] & _rangemask
1313 1316 ):
1314 1317 ladd(fn)
1315 1318 elif st[stat.ST_MTIME] == lastnormaltime:
1316 1319 # fn may have just been marked as normal and it may have
1317 1320 # changed in the same second without changing its size.
1318 1321 # This can happen if we quickly do multiple commits.
1319 1322 # Force lookup, so we don't miss such a racy file change.
1320 1323 ladd(fn)
1321 1324 elif listclean:
1322 1325 cadd(fn)
1323 1326 elif state == b'm':
1324 1327 madd(fn)
1325 1328 elif state == b'a':
1326 1329 aadd(fn)
1327 1330 elif state == b'r':
1328 1331 radd(fn)
1329 1332 status = scmutil.status(
1330 1333 modified, added, removed, deleted, unknown, ignored, clean
1331 1334 )
1332 1335 return (lookup, status)
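        # Illustrative use of the return value (a sketch): callers re-read
        # the "unsure" files to settle them, e.g.
        #   lookup, st = dirstate.status(match, [], False, False, False)
        #   for f in lookup:
        #       ...  # compare f's content against the parent to classify it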
1333 1336
1334 1337 def matches(self, match):
1335 1338 """
1336 1339 return files in the dirstate (in whatever state) filtered by match
1337 1340 """
1338 1341 dmap = self._map
1339 1342 if rustmod is not None:
1340 1343 dmap = self._map._rustmap
1341 1344
1342 1345 if match.always():
1343 1346 return dmap.keys()
1344 1347 files = match.files()
1345 1348 if match.isexact():
1346 1349 # fast path -- filter the other way around, since typically files is
1347 1350 # much smaller than dmap
1348 1351 return [f for f in files if f in dmap]
1349 1352 if match.prefix() and all(fn in dmap for fn in files):
1350 1353 # fast path -- all the values are known to be files, so just return
1351 1354 # that
1352 1355 return list(files)
1353 1356 return [f for f in dmap if match(f)]
1354 1357
1355 1358 def _actualfilename(self, tr):
1356 1359 if tr:
1357 1360 return self._pendingfilename
1358 1361 else:
1359 1362 return self._filename
1360 1363
1361 1364 def savebackup(self, tr, backupname):
1362 1365 '''Save current dirstate into backup file'''
1363 1366 filename = self._actualfilename(tr)
1364 1367 assert backupname != filename
1365 1368
1366 1369         # use '_writedirstate' instead of 'write' to be sure changes get
1367 1370         # written out, because the latter skips writing during a transaction.
1368 1371         # the output file is used to create the dirstate backup at this point.
1369 1372 if self._dirty or not self._opener.exists(filename):
1370 1373 self._writedirstate(
1371 1374 self._opener(filename, b"w", atomictemp=True, checkambig=True)
1372 1375 )
1373 1376
1374 1377 if tr:
1375 1378 # ensure that subsequent tr.writepending returns True for
1376 1379 # changes written out above, even if dirstate is never
1377 1380 # changed after this
1378 1381 tr.addfilegenerator(
1379 1382 b'dirstate',
1380 1383 (self._filename,),
1381 1384 self._writedirstate,
1382 1385 location=b'plain',
1383 1386 )
1384 1387
1385 1388 # ensure that pending file written above is unlinked at
1386 1389 # failure, even if tr.writepending isn't invoked until the
1387 1390 # end of this transaction
1388 1391 tr.registertmp(filename, location=b'plain')
1389 1392
1390 1393 self._opener.tryunlink(backupname)
1391 1394 # hardlink backup is okay because _writedirstate is always called
1392 1395 # with an "atomictemp=True" file.
1393 1396 util.copyfile(
1394 1397 self._opener.join(filename),
1395 1398 self._opener.join(backupname),
1396 1399 hardlink=True,
1397 1400 )
1398 1401
1399 1402 def restorebackup(self, tr, backupname):
1400 1403 '''Restore dirstate by backup file'''
1401 1404 # this "invalidate()" prevents "wlock.release()" from writing
1402 1405 # changes of dirstate out after restoring from backup file
1403 1406 self.invalidate()
1404 1407 filename = self._actualfilename(tr)
1405 1408 o = self._opener
1406 1409 if util.samefile(o.join(backupname), o.join(filename)):
1407 1410 o.unlink(backupname)
1408 1411 else:
1409 1412 o.rename(backupname, filename, checkambig=True)
1410 1413
1411 1414 def clearbackup(self, tr, backupname):
1412 1415 '''Clear backup file'''
1413 1416 self._opener.unlink(backupname)
1414 1417
1415 1418
1416 1419 class dirstatemap(object):
1417 1420 """Map encapsulating the dirstate's contents.
1418 1421
1419 1422 The dirstate contains the following state:
1420 1423
1421 1424 - `identity` is the identity of the dirstate file, which can be used to
1422 1425 detect when changes have occurred to the dirstate file.
1423 1426
1424 1427 - `parents` is a pair containing the parents of the working copy. The
1425 1428 parents are updated by calling `setparents`.
1426 1429
1427 1430 - the state map maps filenames to tuples of (state, mode, size, mtime),
1428 1431 where state is a single character representing 'normal', 'added',
1429 1432 'removed', or 'merged'. It is read by treating the dirstate as a
1430 1433 dict. File state is updated by calling the `addfile`, `removefile` and
1431 1434 `dropfile` methods.
1432 1435
1433 1436 - `copymap` maps destination filenames to their source filename.
1434 1437
1435 1438 The dirstate also provides the following views onto the state:
1436 1439
1437 1440 - `nonnormalset` is a set of the filenames that have state other
1438 1441 than 'normal', or are normal but have an mtime of -1 ('normallookup').
1439 1442
1440 1443 - `otherparentset` is a set of the filenames that are marked as coming
1441 1444 from the second parent when the dirstate is currently being merged.
1442 1445
1443 1446 - `filefoldmap` is a dict mapping normalized filenames to the denormalized
1444 1447 form that they appear as in the dirstate.
1445 1448
1446 1449 - `dirfoldmap` is a dict mapping normalized directory names to the
1447 1450 denormalized form that they appear as in the dirstate.
1448 1451 """
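    # Illustrative entry (hypothetical file): a clean, tracked file might be
    # stored as
    #   self._map[b'foo.py'] == (b'n', 0o644, 1024, 1600000000)
    # i.e. the (state, mode, size, mtime) tuple described above.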
1449 1452
1450 1453 def __init__(self, ui, opener, root, nodeconstants, use_dirstate_v2):
1451 1454 self._ui = ui
1452 1455 self._opener = opener
1453 1456 self._root = root
1454 1457 self._filename = b'dirstate'
1455 1458 self._nodelen = 20
1456 1459 self._nodeconstants = nodeconstants
1457 1460 assert (
1458 1461 not use_dirstate_v2
1459 1462 ), "should have detected unsupported requirement"
1460 1463
1461 1464 self._parents = None
1462 1465 self._dirtyparents = False
1463 1466
1464 1467 # for consistent view between _pl() and _read() invocations
1465 1468 self._pendingmode = None
1466 1469
1467 1470 @propertycache
1468 1471 def _map(self):
1469 1472 self._map = {}
1470 1473 self.read()
1471 1474 return self._map
1472 1475
1473 1476 @propertycache
1474 1477 def copymap(self):
1475 1478 self.copymap = {}
1476 1479 self._map
1477 1480 return self.copymap
1478 1481
1479 1482 def clear(self):
1480 1483 self._map.clear()
1481 1484 self.copymap.clear()
1482 1485 self.setparents(self._nodeconstants.nullid, self._nodeconstants.nullid)
1483 1486 util.clearcachedproperty(self, b"_dirs")
1484 1487 util.clearcachedproperty(self, b"_alldirs")
1485 1488 util.clearcachedproperty(self, b"filefoldmap")
1486 1489 util.clearcachedproperty(self, b"dirfoldmap")
1487 1490 util.clearcachedproperty(self, b"nonnormalset")
1488 1491 util.clearcachedproperty(self, b"otherparentset")
1489 1492
1490 1493 def items(self):
1491 1494 return pycompat.iteritems(self._map)
1492 1495
1493 1496 # forward for python2,3 compat
1494 1497 iteritems = items
1495 1498
1496 1499 def __len__(self):
1497 1500 return len(self._map)
1498 1501
1499 1502 def __iter__(self):
1500 1503 return iter(self._map)
1501 1504
1502 1505 def get(self, key, default=None):
1503 1506 return self._map.get(key, default)
1504 1507
1505 1508 def __contains__(self, key):
1506 1509 return key in self._map
1507 1510
1508 1511 def __getitem__(self, key):
1509 1512 return self._map[key]
1510 1513
1511 1514 def keys(self):
1512 1515 return self._map.keys()
1513 1516
1514 1517 def preload(self):
1515 1518 """Loads the underlying data, if it's not already loaded"""
1516 1519 self._map
1517 1520
1518 1521 def addfile(self, f, oldstate, state, mode, size, mtime):
1519 1522 """Add a tracked file to the dirstate."""
1520 1523 if oldstate in b"?r" and "_dirs" in self.__dict__:
1521 1524 self._dirs.addpath(f)
1522 1525 if oldstate == b"?" and "_alldirs" in self.__dict__:
1523 1526 self._alldirs.addpath(f)
1524 1527 self._map[f] = dirstatetuple(state, mode, size, mtime)
1525 1528 if state != b'n' or mtime == -1:
1526 1529 self.nonnormalset.add(f)
1527 1530 if size == -2:
1528 1531 self.otherparentset.add(f)
1529 1532
1530 1533 def removefile(self, f, oldstate, size):
1531 1534 """
1532 1535 Mark a file as removed in the dirstate.
1533 1536
1534 1537 The `size` parameter is used to store sentinel values that indicate
1535 1538 the file's previous state. In the future, we should refactor this
1536 1539 to be more explicit about what that state is.
1537 1540 """
1538 1541 if oldstate not in b"?r" and "_dirs" in self.__dict__:
1539 1542 self._dirs.delpath(f)
1540 1543 if oldstate == b"?" and "_alldirs" in self.__dict__:
1541 1544 self._alldirs.addpath(f)
1542 1545 if "filefoldmap" in self.__dict__:
1543 1546 normed = util.normcase(f)
1544 1547 self.filefoldmap.pop(normed, None)
1545 1548 self._map[f] = dirstatetuple(b'r', 0, size, 0)
1546 1549 self.nonnormalset.add(f)
1547 1550
1548 1551 def dropfile(self, f, oldstate):
1549 1552 """
1550 1553 Remove a file from the dirstate. Returns True if the file was
1551 1554 previously recorded.
1552 1555 """
1553 1556 exists = self._map.pop(f, None) is not None
1554 1557 if exists:
1555 1558 if oldstate != b"r" and "_dirs" in self.__dict__:
1556 1559 self._dirs.delpath(f)
1557 1560 if "_alldirs" in self.__dict__:
1558 1561 self._alldirs.delpath(f)
1559 1562 if "filefoldmap" in self.__dict__:
1560 1563 normed = util.normcase(f)
1561 1564 self.filefoldmap.pop(normed, None)
1562 1565 self.nonnormalset.discard(f)
1563 1566 return exists
1564 1567
1565 1568 def clearambiguoustimes(self, files, now):
1566 1569 for f in files:
1567 1570 e = self.get(f)
1568 1571 if e is not None and e[0] == b'n' and e[3] == now:
1569 1572 self._map[f] = dirstatetuple(e[0], e[1], e[2], -1)
1570 1573 self.nonnormalset.add(f)
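                # (An mtime of -1 forces the next status() to re-examine the
                # file instead of trusting a timestamp equal to "now".)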
1571 1574
1572 1575 def nonnormalentries(self):
1573 1576 '''Compute the nonnormal dirstate entries from the dmap'''
1574 1577 try:
1575 1578 return parsers.nonnormalotherparententries(self._map)
1576 1579 except AttributeError:
1577 1580 nonnorm = set()
1578 1581 otherparent = set()
1579 1582 for fname, e in pycompat.iteritems(self._map):
1580 1583 if e[0] != b'n' or e[3] == -1:
1581 1584 nonnorm.add(fname)
1582 1585 if e[0] == b'n' and e[2] == -2:
1583 1586 otherparent.add(fname)
1584 1587 return nonnorm, otherparent
1585 1588
1586 1589 @propertycache
1587 1590 def filefoldmap(self):
1588 1591 """Returns a dictionary mapping normalized case paths to their
1589 1592 non-normalized versions.
1590 1593 """
1591 1594 try:
1592 1595 makefilefoldmap = parsers.make_file_foldmap
1593 1596 except AttributeError:
1594 1597 pass
1595 1598 else:
1596 1599 return makefilefoldmap(
1597 1600 self._map, util.normcasespec, util.normcasefallback
1598 1601 )
1599 1602
1600 1603 f = {}
1601 1604 normcase = util.normcase
1602 1605 for name, s in pycompat.iteritems(self._map):
1603 1606 if s[0] != b'r':
1604 1607 f[normcase(name)] = name
1605 1608 f[b'.'] = b'.' # prevents useless util.fspath() invocation
1606 1609 return f
1607 1610
1608 1611 def hastrackeddir(self, d):
1609 1612 """
1610 1613 Returns True if the dirstate contains a tracked (not removed) file
1611 1614 in this directory.
1612 1615 """
1613 1616 return d in self._dirs
1614 1617
1615 1618 def hasdir(self, d):
1616 1619 """
1617 1620 Returns True if the dirstate contains a file (tracked or removed)
1618 1621 in this directory.
1619 1622 """
1620 1623 return d in self._alldirs
1621 1624
1622 1625 @propertycache
1623 1626 def _dirs(self):
1624 1627 return pathutil.dirs(self._map, b'r')
1625 1628
1626 1629 @propertycache
1627 1630 def _alldirs(self):
1628 1631 return pathutil.dirs(self._map)
1629 1632
1630 1633 def _opendirstatefile(self):
1631 1634 fp, mode = txnutil.trypending(self._root, self._opener, self._filename)
1632 1635 if self._pendingmode is not None and self._pendingmode != mode:
1633 1636 fp.close()
1634 1637 raise error.Abort(
1635 1638 _(b'working directory state may be changed parallelly')
1636 1639 )
1637 1640 self._pendingmode = mode
1638 1641 return fp
1639 1642
1640 1643 def parents(self):
1641 1644 if not self._parents:
1642 1645 try:
1643 1646 fp = self._opendirstatefile()
1644 1647 st = fp.read(2 * self._nodelen)
1645 1648 fp.close()
1646 1649 except IOError as err:
1647 1650 if err.errno != errno.ENOENT:
1648 1651 raise
1649 1652 # File doesn't exist, so the current state is empty
1650 1653 st = b''
1651 1654
1652 1655 l = len(st)
1653 1656 if l == self._nodelen * 2:
1654 1657 self._parents = (
1655 1658 st[: self._nodelen],
1656 1659 st[self._nodelen : 2 * self._nodelen],
1657 1660 )
1658 1661 elif l == 0:
1659 1662 self._parents = (
1660 1663 self._nodeconstants.nullid,
1661 1664 self._nodeconstants.nullid,
1662 1665 )
1663 1666 else:
1664 1667 raise error.Abort(
1665 1668 _(b'working directory state appears damaged!')
1666 1669 )
1667 1670
1668 1671 return self._parents
1669 1672
1670 1673 def setparents(self, p1, p2):
1671 1674 self._parents = (p1, p2)
1672 1675 self._dirtyparents = True
1673 1676
1674 1677 def read(self):
1675 1678 # ignore HG_PENDING because identity is used only for writing
1676 1679 self.identity = util.filestat.frompath(
1677 1680 self._opener.join(self._filename)
1678 1681 )
1679 1682
1680 1683 try:
1681 1684 fp = self._opendirstatefile()
1682 1685 try:
1683 1686 st = fp.read()
1684 1687 finally:
1685 1688 fp.close()
1686 1689 except IOError as err:
1687 1690 if err.errno != errno.ENOENT:
1688 1691 raise
1689 1692 return
1690 1693 if not st:
1691 1694 return
1692 1695
1693 1696 if util.safehasattr(parsers, b'dict_new_presized'):
1694 1697 # Make an estimate of the number of files in the dirstate based on
1695 1698 # its size. This trades wasting some memory for avoiding costly
1696 1699             # resizes. Each entry has a prefix of 17 bytes followed by one or
1697 1700             # two path names. Studies on various large-scale real-world repositories
1698 1701             # found 54 bytes to be a reasonable upper limit for the average path name.
1699 1702 # Copy entries are ignored for the sake of this estimate.
1700 1703 self._map = parsers.dict_new_presized(len(st) // 71)
1701 1704
1702 1705 # Python's garbage collector triggers a GC each time a certain number
1703 1706 # of container objects (the number being defined by
1704 1707 # gc.get_threshold()) are allocated. parse_dirstate creates a tuple
1705 1708 # for each file in the dirstate. The C version then immediately marks
1706 1709 # them as not to be tracked by the collector. However, this has no
1707 1710 # effect on when GCs are triggered, only on what objects the GC looks
1708 1711 # into. This means that O(number of files) GCs are unavoidable.
1709 1712 # Depending on when in the process's lifetime the dirstate is parsed,
1710 1713 # this can get very expensive. As a workaround, disable GC while
1711 1714 # parsing the dirstate.
1712 1715 #
1713 1716 # (we cannot decorate the function directly since it is in a C module)
1714 1717 parse_dirstate = util.nogc(parsers.parse_dirstate)
1715 1718 p = parse_dirstate(self._map, self.copymap, st)
1716 1719 if not self._dirtyparents:
1717 1720 self.setparents(*p)
1718 1721
1719 1722 # Avoid excess attribute lookups by fast pathing certain checks
1720 1723 self.__contains__ = self._map.__contains__
1721 1724 self.__getitem__ = self._map.__getitem__
1722 1725 self.get = self._map.get
1723 1726
1724 1727 def write(self, st, now):
1725 1728 st.write(
1726 1729 parsers.pack_dirstate(self._map, self.copymap, self.parents(), now)
1727 1730 )
1728 1731 st.close()
1729 1732 self._dirtyparents = False
1730 1733 self.nonnormalset, self.otherparentset = self.nonnormalentries()
1731 1734
1732 1735 @propertycache
1733 1736 def nonnormalset(self):
1734 1737 nonnorm, otherparents = self.nonnormalentries()
1735 1738 self.otherparentset = otherparents
1736 1739 return nonnorm
1737 1740
1738 1741 @propertycache
1739 1742 def otherparentset(self):
1740 1743 nonnorm, otherparents = self.nonnormalentries()
1741 1744 self.nonnormalset = nonnorm
1742 1745 return otherparents
1743 1746
1744 1747 def non_normal_or_other_parent_paths(self):
1745 1748 return self.nonnormalset.union(self.otherparentset)
1746 1749
1747 1750 @propertycache
1748 1751 def identity(self):
1749 1752 self._map
1750 1753 return self.identity
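        # (Accessing self._map runs read(), which assigns self.identity as a
        # plain instance attribute; that value then shadows this property on
        # later lookups.)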
1751 1754
1752 1755 @propertycache
1753 1756 def dirfoldmap(self):
1754 1757 f = {}
1755 1758 normcase = util.normcase
1756 1759 for name in self._dirs:
1757 1760 f[normcase(name)] = name
1758 1761 return f
1759 1762
1760 1763
1761 1764 if rustmod is not None:
1762 1765
1763 1766 class dirstatemap(object):
1764 1767 def __init__(self, ui, opener, root, nodeconstants, use_dirstate_v2):
1765 1768 self._use_dirstate_v2 = use_dirstate_v2
1766 1769 self._nodeconstants = nodeconstants
1767 1770 self._ui = ui
1768 1771 self._opener = opener
1769 1772 self._root = root
1770 1773 self._filename = b'dirstate'
1771 1774 self._nodelen = 20 # Also update Rust code when changing this!
1772 1775 self._parents = None
1773 1776 self._dirtyparents = False
1774 1777
1775 1778 # for consistent view between _pl() and _read() invocations
1776 1779 self._pendingmode = None
1777 1780
1778 1781 self._use_dirstate_tree = self._ui.configbool(
1779 1782 b"experimental",
1780 1783 b"dirstate-tree.in-memory",
1781 1784 False,
1782 1785 )
1783 1786
1784 1787 def addfile(self, *args, **kwargs):
1785 1788 return self._rustmap.addfile(*args, **kwargs)
1786 1789
1787 1790 def removefile(self, *args, **kwargs):
1788 1791 return self._rustmap.removefile(*args, **kwargs)
1789 1792
1790 1793 def dropfile(self, *args, **kwargs):
1791 1794 return self._rustmap.dropfile(*args, **kwargs)
1792 1795
1793 1796 def clearambiguoustimes(self, *args, **kwargs):
1794 1797 return self._rustmap.clearambiguoustimes(*args, **kwargs)
1795 1798
1796 1799 def nonnormalentries(self):
1797 1800 return self._rustmap.nonnormalentries()
1798 1801
1799 1802 def get(self, *args, **kwargs):
1800 1803 return self._rustmap.get(*args, **kwargs)
1801 1804
1802 1805 @property
1803 1806 def copymap(self):
1804 1807 return self._rustmap.copymap()
1805 1808
1806 1809 def preload(self):
1807 1810 self._rustmap
1808 1811
1809 1812 def clear(self):
1810 1813 self._rustmap.clear()
1811 1814 self.setparents(
1812 1815 self._nodeconstants.nullid, self._nodeconstants.nullid
1813 1816 )
1814 1817 util.clearcachedproperty(self, b"_dirs")
1815 1818 util.clearcachedproperty(self, b"_alldirs")
1816 1819 util.clearcachedproperty(self, b"dirfoldmap")
1817 1820
1818 1821 def items(self):
1819 1822 return self._rustmap.items()
1820 1823
1821 1824 def keys(self):
1822 1825 return iter(self._rustmap)
1823 1826
1824 1827 def __contains__(self, key):
1825 1828 return key in self._rustmap
1826 1829
1827 1830 def __getitem__(self, item):
1828 1831 return self._rustmap[item]
1829 1832
1830 1833 def __len__(self):
1831 1834 return len(self._rustmap)
1832 1835
1833 1836 def __iter__(self):
1834 1837 return iter(self._rustmap)
1835 1838
1836 1839 # forward for python2,3 compat
1837 1840 iteritems = items
1838 1841
1839 1842 def _opendirstatefile(self):
1840 1843 fp, mode = txnutil.trypending(
1841 1844 self._root, self._opener, self._filename
1842 1845 )
1843 1846 if self._pendingmode is not None and self._pendingmode != mode:
1844 1847 fp.close()
1845 1848 raise error.Abort(
1846 1849 _(b'working directory state may be changed parallelly')
1847 1850 )
1848 1851 self._pendingmode = mode
1849 1852 return fp
1850 1853
1851 1854 def setparents(self, p1, p2):
1852 1855 self._parents = (p1, p2)
1853 1856 self._dirtyparents = True
1854 1857
1855 1858 def parents(self):
1856 1859 if not self._parents:
1857 1860 if self._use_dirstate_v2:
1858 1861 offset = len(rustmod.V2_FORMAT_MARKER)
1859 1862 else:
1860 1863 offset = 0
1861 1864 read_len = offset + self._nodelen * 2
1862 1865 try:
1863 1866 fp = self._opendirstatefile()
1864 1867 st = fp.read(read_len)
1865 1868 fp.close()
1866 1869 except IOError as err:
1867 1870 if err.errno != errno.ENOENT:
1868 1871 raise
1869 1872 # File doesn't exist, so the current state is empty
1870 1873 st = b''
1871 1874
1872 1875 l = len(st)
1873 1876 if l == read_len:
1874 1877 st = st[offset:]
1875 1878 self._parents = (
1876 1879 st[: self._nodelen],
1877 1880 st[self._nodelen : 2 * self._nodelen],
1878 1881 )
1879 1882 elif l == 0:
1880 1883 self._parents = (
1881 1884 self._nodeconstants.nullid,
1882 1885 self._nodeconstants.nullid,
1883 1886 )
1884 1887 else:
1885 1888 raise error.Abort(
1886 1889 _(b'working directory state appears damaged!')
1887 1890 )
1888 1891
1889 1892 return self._parents
1890 1893
1891 1894 @propertycache
1892 1895 def _rustmap(self):
1893 1896 """
1894 1897             Fills the DirstateMap when called.
1895 1898 """
1896 1899 # ignore HG_PENDING because identity is used only for writing
1897 1900 self.identity = util.filestat.frompath(
1898 1901 self._opener.join(self._filename)
1899 1902 )
1900 1903
1901 1904 try:
1902 1905 fp = self._opendirstatefile()
1903 1906 try:
1904 1907 st = fp.read()
1905 1908 finally:
1906 1909 fp.close()
1907 1910 except IOError as err:
1908 1911 if err.errno != errno.ENOENT:
1909 1912 raise
1910 1913 st = b''
1911 1914
1912 1915 self._rustmap, parents = rustmod.DirstateMap.new(
1913 1916 self._use_dirstate_tree, self._use_dirstate_v2, st
1914 1917 )
1915 1918
1916 1919 if parents and not self._dirtyparents:
1917 1920 self.setparents(*parents)
1918 1921
1919 1922 self.__contains__ = self._rustmap.__contains__
1920 1923 self.__getitem__ = self._rustmap.__getitem__
1921 1924 self.get = self._rustmap.get
1922 1925 return self._rustmap
1923 1926
1924 1927 def write(self, st, now):
1925 1928 parents = self.parents()
1926 1929 packed = self._rustmap.write(
1927 1930 self._use_dirstate_v2, parents[0], parents[1], now
1928 1931 )
1929 1932 st.write(packed)
1930 1933 st.close()
1931 1934 self._dirtyparents = False
1932 1935
1933 1936 @propertycache
1934 1937 def filefoldmap(self):
1935 1938 """Returns a dictionary mapping normalized case paths to their
1936 1939 non-normalized versions.
1937 1940 """
1938 1941 return self._rustmap.filefoldmapasdict()
1939 1942
1940 1943 def hastrackeddir(self, d):
1941 1944 self._dirs # Trigger Python's propertycache
1942 1945 return self._rustmap.hastrackeddir(d)
1943 1946
1944 1947 def hasdir(self, d):
1945 1948 self._dirs # Trigger Python's propertycache
1946 1949 return self._rustmap.hasdir(d)
1947 1950
1948 1951 @propertycache
1949 1952 def _dirs(self):
1950 1953 return self._rustmap.getdirs()
1951 1954
1952 1955 @propertycache
1953 1956 def _alldirs(self):
1954 1957 return self._rustmap.getalldirs()
1955 1958
1956 1959 @propertycache
1957 1960 def identity(self):
1958 1961 self._rustmap
1959 1962 return self.identity
1960 1963
1961 1964 @property
1962 1965 def nonnormalset(self):
1963 1966 nonnorm = self._rustmap.non_normal_entries()
1964 1967 return nonnorm
1965 1968
1966 1969 @propertycache
1967 1970 def otherparentset(self):
1968 1971 otherparents = self._rustmap.other_parent_entries()
1969 1972 return otherparents
1970 1973
1971 1974 def non_normal_or_other_parent_paths(self):
1972 1975 return self._rustmap.non_normal_or_other_parent_paths()
1973 1976
1974 1977 @propertycache
1975 1978 def dirfoldmap(self):
1976 1979 f = {}
1977 1980 normcase = util.normcase
1978 1981 for name in self._dirs:
1979 1982 f[normcase(name)] = name
1980 1983 return f
@@ -1,942 +1,947 b''
1 1 // status.rs
2 2 //
3 3 // Copyright 2019 Raphaël Gomès <rgomes@octobus.net>
4 4 //
5 5 // This software may be used and distributed according to the terms of the
6 6 // GNU General Public License version 2 or any later version.
7 7
8 8 //! Rust implementation of dirstate.status (dirstate.py).
9 9 //! It is currently missing a lot of functionality compared to the Python one
10 10 //! and will only be triggered in narrow cases.
11 11
12 12 use crate::dirstate_tree::on_disk::DirstateV2ParseError;
13 13 use crate::utils::path_auditor::PathAuditor;
14 14 use crate::{
15 15 dirstate::SIZE_FROM_OTHER_PARENT,
16 16 filepatterns::PatternFileWarning,
17 17 matchers::{get_ignore_function, Matcher, VisitChildrenSet},
18 18 utils::{
19 19 files::{find_dirs, HgMetadata},
20 20 hg_path::{
21 21 hg_path_to_path_buf, os_string_to_hg_path_buf, HgPath, HgPathBuf,
22 22 HgPathError,
23 23 },
24 24 },
25 25 CopyMap, DirstateEntry, DirstateMap, EntryState, FastHashMap,
26 26 PatternError,
27 27 };
28 28 use lazy_static::lazy_static;
29 29 use micro_timer::timed;
30 30 use rayon::prelude::*;
31 31 use std::{
32 32 borrow::Cow,
33 33 collections::HashSet,
34 34 fmt,
35 35 fs::{read_dir, DirEntry},
36 36 io::ErrorKind,
37 37 ops::Deref,
38 38 path::{Path, PathBuf},
39 39 };
40 40
41 41 /// Wrong type of file from a `BadMatch`
42 42 /// Note: a lot of those don't exist on all platforms.
43 43 #[derive(Debug, Copy, Clone)]
44 44 pub enum BadType {
45 45 CharacterDevice,
46 46 BlockDevice,
47 47 FIFO,
48 48 Socket,
49 49 Directory,
50 50 Unknown,
51 51 }
52 52
53 53 impl fmt::Display for BadType {
54 54 fn fmt(&self, f: &mut fmt::Formatter) -> fmt::Result {
55 55 f.write_str(match self {
56 56 BadType::CharacterDevice => "character device",
57 57 BadType::BlockDevice => "block device",
58 58 BadType::FIFO => "fifo",
59 59 BadType::Socket => "socket",
60 60 BadType::Directory => "directory",
61 61 BadType::Unknown => "unknown",
62 62 })
63 63 }
64 64 }
65 65
66 66 /// Was explicitly matched but cannot be found/accessed
67 67 #[derive(Debug, Copy, Clone)]
68 68 pub enum BadMatch {
69 69 OsError(i32),
70 70 BadType(BadType),
71 71 }
72 72
73 73 /// Enum used to dispatch new status entries into the right collections.
74 74 /// Is similar to `crate::EntryState`, but represents the transient state of
75 75 /// entries during the lifetime of a command.
76 76 #[derive(Debug, Copy, Clone)]
77 77 pub enum Dispatch {
78 78 Unsure,
79 79 Modified,
80 80 Added,
81 81 Removed,
82 82 Deleted,
83 83 Clean,
84 84 Unknown,
85 85 Ignored,
86 86 /// Empty dispatch, the file is not worth listing
87 87 None,
88 88 /// Was explicitly matched but cannot be found/accessed
89 89 Bad(BadMatch),
90 90 Directory {
91 91 /// True if the directory used to be a file in the dmap so we can say
92 92 /// that it's been removed.
93 93 was_file: bool,
94 94 },
95 95 }
96 96
97 97 type IoResult<T> = std::io::Result<T>;
98 98
99 99 /// `Box<dyn Trait>` is syntactic sugar for `Box<dyn Trait + 'static>`, so add
100 100 /// an explicit lifetime here to not fight `'static` bounds "out of nowhere".
101 101 pub type IgnoreFnType<'a> =
102 102 Box<dyn for<'r> Fn(&'r HgPath) -> bool + Sync + 'a>;
103 103
104 104 /// We have a good mix of owned (from directory traversal) and borrowed (from
105 105 /// the dirstate/explicit) paths, this comes up a lot.
106 106 pub type HgPathCow<'a> = Cow<'a, HgPath>;
107 107
108 108 /// A path with its computed ``Dispatch`` information
109 109 type DispatchedPath<'a> = (HgPathCow<'a>, Dispatch);
110 110
111 111 /// The conversion from `HgPath` to a real fs path failed.
112 112 /// `22` is the error code for "Invalid argument"
113 113 const INVALID_PATH_DISPATCH: Dispatch = Dispatch::Bad(BadMatch::OsError(22));
114 114
115 115 /// Dates and times that are outside the 31-bit signed range are compared
116 116 /// modulo 2^31. This should prevent hg from behaving badly with very large
117 117 /// files or corrupt dates while still having a high probability of detecting
118 118 /// changes. (issue2608)
119 119 /// TODO I haven't found a way of having `b` be `Into<i32>`, since `From<u64>`
120 120 /// is not defined for `i32`, and there is no `As` trait. This forces the
121 121 /// caller to cast `b` as `i32`.
122 122 fn mod_compare(a: i32, b: i32) -> bool {
123 123 a & i32::max_value() != b & i32::max_value()
124 124 }
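
For illustration, a standalone sketch (not part of the diff; the function body is copied from this file) of the modulo-2^31 comparison: masking with `i32::max_value()` keeps the low 31 bits, so values that differ only above bit 31 compare as equal.

    fn mod_compare(a: i32, b: i32) -> bool {
        a & i32::max_value() != b & i32::max_value()
    }

    fn main() {
        let big = ((1u64 << 31) + 5) as i32; // 2^31 + 5, truncated: wraps to a negative i32
        assert!(!mod_compare(5, big)); // equal modulo 2^31, so no change is reported
        assert!(mod_compare(5, 6)); // genuinely different sizes still compare as different
    }
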
125 125
126 126 /// Return a sorted list containing information about the entries
127 127 /// in the directory.
128 128 ///
129 129 /// * `skip_dot_hg` - Return an empty vec if `path` contains a `.hg` directory
130 130 fn list_directory(
131 131 path: impl AsRef<Path>,
132 132 skip_dot_hg: bool,
133 133 ) -> std::io::Result<Vec<(HgPathBuf, DirEntry)>> {
134 134 let mut results = vec![];
135 135 let entries = read_dir(path.as_ref())?;
136 136
137 137 for entry in entries {
138 138 let entry = entry?;
139 139 let filename = os_string_to_hg_path_buf(entry.file_name())?;
140 140 let file_type = entry.file_type()?;
141 141 if skip_dot_hg && filename.as_bytes() == b".hg" && file_type.is_dir() {
142 142 return Ok(vec![]);
143 143 } else {
144 144 results.push((filename, entry))
145 145 }
146 146 }
147 147
148 148 results.sort_unstable_by_key(|e| e.0.clone());
149 149 Ok(results)
150 150 }
151 151
152 152 /// The file corresponding to the dirstate entry was found on the filesystem.
153 153 fn dispatch_found(
154 154 filename: impl AsRef<HgPath>,
155 155 entry: DirstateEntry,
156 156 metadata: HgMetadata,
157 157 copy_map: &CopyMap,
158 158 options: StatusOptions,
159 159 ) -> Dispatch {
160 160 let DirstateEntry {
161 161 state,
162 162 mode,
163 163 mtime,
164 164 size,
165 165 } = entry;
166 166
167 167 let HgMetadata {
168 168 st_mode,
169 169 st_size,
170 170 st_mtime,
171 171 ..
172 172 } = metadata;
173 173
174 174 match state {
175 175 EntryState::Normal => {
176 176 let size_changed = mod_compare(size, st_size as i32);
177 177 let mode_changed =
178 178 (mode ^ st_mode as i32) & 0o100 != 0o000 && options.check_exec;
179 179 let metadata_changed = size >= 0 && (size_changed || mode_changed);
180 180 let other_parent = size == SIZE_FROM_OTHER_PARENT;
181 181
182 182 if metadata_changed
183 183 || other_parent
184 184 || copy_map.contains_key(filename.as_ref())
185 185 {
186 186 if metadata.is_symlink() && size_changed {
187 187 // issue6456: Size returned may be longer due to encryption
188 188 // on EXT-4 fscrypt. TODO maybe only do it on EXT4?
189 189 Dispatch::Unsure
190 190 } else {
191 191 Dispatch::Modified
192 192 }
193 193 } else if mod_compare(mtime, st_mtime as i32)
194 194 || st_mtime == options.last_normal_time
195 195 {
196 196 // the file may have just been marked as normal and
197 197 // it may have changed in the same second without
198 198 // changing its size. This can happen if we quickly
199 199 // do multiple commits. Force lookup, so we don't
200 200 // miss such a racy file change.
201 201 Dispatch::Unsure
202 202 } else if options.list_clean {
203 203 Dispatch::Clean
204 204 } else {
205 205 Dispatch::None
206 206 }
207 207 }
208 208 EntryState::Merged => Dispatch::Modified,
209 209 EntryState::Added => Dispatch::Added,
210 210 EntryState::Removed => Dispatch::Removed,
211 211 EntryState::Unknown => Dispatch::Unknown,
212 212 }
213 213 }
214 214
215 215 /// The file corresponding to this Dirstate entry is missing.
216 216 fn dispatch_missing(state: EntryState) -> Dispatch {
217 217 match state {
218 218 // File was removed from the filesystem during commands
219 219 EntryState::Normal | EntryState::Merged | EntryState::Added => {
220 220 Dispatch::Deleted
221 221 }
222 222 // File was removed, everything is normal
223 223 EntryState::Removed => Dispatch::Removed,
224 224 // File is unknown to Mercurial, everything is normal
225 225 EntryState::Unknown => Dispatch::Unknown,
226 226 }
227 227 }
228 228
229 229 fn dispatch_os_error(e: &std::io::Error) -> Dispatch {
230 230 Dispatch::Bad(BadMatch::OsError(
231 231 e.raw_os_error().expect("expected real OS error"),
232 232 ))
233 233 }
234 234
235 235 lazy_static! {
236 236 static ref DEFAULT_WORK: HashSet<&'static HgPath> = {
237 237 let mut h = HashSet::new();
238 238 h.insert(HgPath::new(b""));
239 239 h
240 240 };
241 241 }
242 242
243 243 #[derive(Debug, Copy, Clone)]
244 244 pub struct StatusOptions {
245 245 /// Remember the most recent modification timeslot for status, to make
246 246 /// sure we won't miss future size-preserving file content modifications
247 247 /// that happen within the same timeslot.
248 248 pub last_normal_time: i64,
249 249 /// Whether we are on a filesystem with UNIX-like exec flags
250 250 pub check_exec: bool,
251 251 pub list_clean: bool,
252 252 pub list_unknown: bool,
253 253 pub list_ignored: bool,
254 254 /// Whether to collect traversed dirs for applying a callback later.
255 255 /// Used by `hg purge` for example.
256 256 pub collect_traversed_dirs: bool,
257 257 }
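
For orientation, a hypothetical configuration mirroring a plain `hg status` run (which lists unknown files but not clean or ignored ones); the `last_normal_time` value is whatever timeslot the caller last recorded:

    fn plain_status_options(last_normal_time: i64) -> StatusOptions {
        StatusOptions {
            last_normal_time,
            check_exec: true, // assume a UNIX-like filesystem with exec bits
            list_clean: false,
            list_unknown: true,
            list_ignored: false,
            collect_traversed_dirs: false, // only `hg purge`-like callers need this
        }
    }
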
258 258
259 259 #[derive(Debug, Default)]
260 260 pub struct DirstateStatus<'a> {
261 261 /// Tracked files whose contents have changed since the parent revision
262 262 pub modified: Vec<HgPathCow<'a>>,
263 263
264 264 /// Newly-tracked files that were not present in the parent
265 265 pub added: Vec<HgPathCow<'a>>,
266 266
267 267 /// Previously-tracked files that have been (re)moved with an hg command
268 268 pub removed: Vec<HgPathCow<'a>>,
269 269
270 270 /// (Still) tracked files that are missing, (re)moved with an non-hg
271 271 /// command
272 272 pub deleted: Vec<HgPathCow<'a>>,
273 273
274 274 /// Tracked files that are up to date with the parent.
275 275 /// Only populated if `StatusOptions::list_clean` is true.
276 276 pub clean: Vec<HgPathCow<'a>>,
277 277
278 278 /// Files in the working directory that are ignored with `.hgignore`.
280 280 /// Only populated if `StatusOptions::list_ignored` is true.
280 280 pub ignored: Vec<HgPathCow<'a>>,
281 281
282 282 /// Files in the working directory that are neither tracked nor ignored.
284 284 /// Only populated if `StatusOptions::list_unknown` is true.
284 284 pub unknown: Vec<HgPathCow<'a>>,
285 285
286 286 /// Was explicitly matched but cannot be found/accessed
287 287 pub bad: Vec<(HgPathCow<'a>, BadMatch)>,
288 288
289 289 /// Either clean or modified, but we can’t tell from filesystem metadata
290 290 /// alone. The file contents need to be read and compared with that in
291 291 /// the parent.
292 292 pub unsure: Vec<HgPathCow<'a>>,
293 293
294 294 /// Only filled if `collect_traversed_dirs` is `true`
295 295 pub traversed: Vec<HgPathCow<'a>>,
296
297 /// Whether `status()` made changes to the `DirstateMap` that should be
298 /// written back to disk
299 pub dirty: bool,
296 300 }
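
A minimal sketch of how a caller might consume the new `dirty` flag; `persist` is a hypothetical stand-in for the layer that serializes the dirstate back to `.hg/dirstate`:

    fn handle_outcome(outcome: &DirstateStatus<'_>, persist: impl FnOnce()) {
        if outcome.dirty {
            // status() added or refreshed cached directory mtimes, so the
            // updated DirstateMap should be written back to disk.
            persist();
        }
    }
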
297 301
298 302 #[derive(Debug, derive_more::From)]
299 303 pub enum StatusError {
300 304 /// Generic IO error
301 305 IO(std::io::Error),
302 306 /// An invalid path that cannot be represented in Mercurial was found
303 307 Path(HgPathError),
304 308 /// An invalid "ignore" pattern was found
305 309 Pattern(PatternError),
306 310 /// Corrupted dirstate
307 311 DirstateV2ParseError(DirstateV2ParseError),
308 312 }
309 313
310 314 pub type StatusResult<T> = Result<T, StatusError>;
311 315
312 316 impl fmt::Display for StatusError {
313 317 fn fmt(&self, f: &mut fmt::Formatter) -> fmt::Result {
314 318 match self {
315 319 StatusError::IO(error) => error.fmt(f),
316 320 StatusError::Path(error) => error.fmt(f),
317 321 StatusError::Pattern(error) => error.fmt(f),
318 322 StatusError::DirstateV2ParseError(_) => {
319 323 f.write_str("dirstate-v2 parse error")
320 324 }
321 325 }
322 326 }
323 327 }
324 328
325 329 /// Gives information about which files are changed in the working directory
326 330 /// and how, compared to the revision we're based on
327 331 pub struct Status<'a, M: ?Sized + Matcher + Sync> {
328 332 dmap: &'a DirstateMap,
329 333 pub(crate) matcher: &'a M,
330 334 root_dir: PathBuf,
331 335 pub(crate) options: StatusOptions,
332 336 ignore_fn: IgnoreFnType<'a>,
333 337 }
334 338
335 339 impl<'a, M> Status<'a, M>
336 340 where
337 341 M: ?Sized + Matcher + Sync,
338 342 {
339 343 pub fn new(
340 344 dmap: &'a DirstateMap,
341 345 matcher: &'a M,
342 346 root_dir: PathBuf,
343 347 ignore_files: Vec<PathBuf>,
344 348 options: StatusOptions,
345 349 ) -> StatusResult<(Self, Vec<PatternFileWarning>)> {
346 350 // Needs to outlive `dir_ignore_fn` since it's captured.
347 351
348 352 let (ignore_fn, warnings): (IgnoreFnType, _) =
349 353 if options.list_ignored || options.list_unknown {
350 354 get_ignore_function(ignore_files, &root_dir)?
351 355 } else {
352 356 (Box::new(|&_| true), vec![])
353 357 };
354 358
355 359 Ok((
356 360 Self {
357 361 dmap,
358 362 matcher,
359 363 root_dir,
360 364 options,
361 365 ignore_fn,
362 366 },
363 367 warnings,
364 368 ))
365 369 }
366 370
367 371 /// Is the path ignored?
368 372 pub fn is_ignored(&self, path: impl AsRef<HgPath>) -> bool {
369 373 (self.ignore_fn)(path.as_ref())
370 374 }
371 375
372 376 /// Is the path or one of its ancestors ignored?
373 377 pub fn dir_ignore(&self, dir: impl AsRef<HgPath>) -> bool {
374 378 // Only involve ignore mechanism if we're listing unknowns or ignored.
375 379 if self.options.list_ignored || self.options.list_unknown {
376 380 if self.is_ignored(&dir) {
377 381 true
378 382 } else {
379 383 for p in find_dirs(dir.as_ref()) {
380 384 if self.is_ignored(p) {
381 385 return true;
382 386 }
383 387 }
384 388 false
385 389 }
386 390 } else {
387 391 true
388 392 }
389 393 }
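
For intuition, a plain-string sketch (an assumption for illustration, not hg-core's actual `find_dirs` implementation) of the ancestor walk this relies on:

    fn main() {
        let mut dir = "a/b/c";
        while let Some(idx) = dir.rfind('/') {
            dir = &dir[..idx];
            println!("ancestor: {}", dir); // prints "a/b", then "a"
        }
    }
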
390 394
391 395 /// Get stat data about the files explicitly specified by the matcher.
392 396 /// Returns a tuple of the directories that need to be traversed and the
393 397 /// files with their corresponding `Dispatch`.
394 398 /// TODO subrepos
395 399 #[timed]
396 400 pub fn walk_explicit(
397 401 &self,
398 402 traversed_sender: crossbeam_channel::Sender<HgPathBuf>,
399 403 ) -> (Vec<DispatchedPath<'a>>, Vec<DispatchedPath<'a>>) {
400 404 self.matcher
401 405 .file_set()
402 406 .unwrap_or(&DEFAULT_WORK)
403 407 .par_iter()
404 408 .flat_map(|&filename| -> Option<_> {
405 409 // TODO normalization
406 410 let normalized = filename;
407 411
408 412 let buf = match hg_path_to_path_buf(normalized) {
409 413 Ok(x) => x,
410 414 Err(_) => {
411 415 return Some((
412 416 Cow::Borrowed(normalized),
413 417 INVALID_PATH_DISPATCH,
414 418 ))
415 419 }
416 420 };
417 421 let target = self.root_dir.join(buf);
418 422 let st = target.symlink_metadata();
419 423 let in_dmap = self.dmap.get(normalized);
420 424 match st {
421 425 Ok(meta) => {
422 426 let file_type = meta.file_type();
423 427 return if file_type.is_file() || file_type.is_symlink()
424 428 {
425 429 if let Some(entry) = in_dmap {
426 430 return Some((
427 431 Cow::Borrowed(normalized),
428 432 dispatch_found(
429 433 &normalized,
430 434 *entry,
431 435 HgMetadata::from_metadata(meta),
432 436 &self.dmap.copy_map,
433 437 self.options,
434 438 ),
435 439 ));
436 440 }
437 441 Some((
438 442 Cow::Borrowed(normalized),
439 443 Dispatch::Unknown,
440 444 ))
441 445 } else if file_type.is_dir() {
442 446 if self.options.collect_traversed_dirs {
443 447 traversed_sender
444 448 .send(normalized.to_owned())
445 449 .expect("receiver should outlive sender");
446 450 }
447 451 Some((
448 452 Cow::Borrowed(normalized),
449 453 Dispatch::Directory {
450 454 was_file: in_dmap.is_some(),
451 455 },
452 456 ))
453 457 } else {
454 458 Some((
455 459 Cow::Borrowed(normalized),
456 460 Dispatch::Bad(BadMatch::BadType(
457 461 // TODO do more than unknown
458 462 // Support for all `BadType` variant
459 463 // varies greatly between platforms.
460 464 // So far, no tests check the type and
461 465 // this should be good enough for most
462 466 // users.
463 467 BadType::Unknown,
464 468 )),
465 469 ))
466 470 };
467 471 }
468 472 Err(_) => {
469 473 if let Some(entry) = in_dmap {
470 474 return Some((
471 475 Cow::Borrowed(normalized),
472 476 dispatch_missing(entry.state),
473 477 ));
474 478 }
475 479 }
476 480 };
477 481 None
478 482 })
479 483 .partition(|(_, dispatch)| match dispatch {
480 484 Dispatch::Directory { .. } => true,
481 485 _ => false,
482 486 })
483 487 }
484 488
485 489 /// Walk the working directory recursively to look for changes compared to
486 490 /// the current `DirstateMap`.
487 491 ///
488 492 /// This takes a mutable reference to the results to account for the
489 493 /// `extend` in timings
490 494 #[timed]
491 495 pub fn traverse(
492 496 &self,
493 497 path: impl AsRef<HgPath>,
494 498 old_results: &FastHashMap<HgPathCow<'a>, Dispatch>,
495 499 results: &mut Vec<DispatchedPath<'a>>,
496 500 traversed_sender: crossbeam_channel::Sender<HgPathBuf>,
497 501 ) {
498 502 // The traversal is done in parallel, so use a channel to gather
499 503 // entries. `crossbeam_channel::Sender` is `Sync`, while `mpsc::Sender`
500 504 // is not.
501 505 let (files_transmitter, files_receiver) =
502 506 crossbeam_channel::unbounded();
503 507
504 508 self.traverse_dir(
505 509 &files_transmitter,
506 510 path,
507 511 &old_results,
508 512 traversed_sender,
509 513 );
510 514
511 515 // Disconnect the channel so the receiver stops waiting
512 516 drop(files_transmitter);
513 517
514 518 let new_results = files_receiver
515 519 .into_iter()
516 520 .par_bridge()
517 521 .map(|(f, d)| (Cow::Owned(f), d));
518 522
519 523 results.par_extend(new_results);
520 524 }
521 525
522 526 /// Dispatch a single entry (file, folder, symlink...) found during
523 527 /// `traverse`. If the entry is a folder that needs to be traversed, it
524 528 /// will be handled in a separate thread.
525 529 fn handle_traversed_entry<'b>(
526 530 &'a self,
527 531 scope: &rayon::Scope<'b>,
528 532 files_sender: &'b crossbeam_channel::Sender<(HgPathBuf, Dispatch)>,
529 533 old_results: &'a FastHashMap<Cow<HgPath>, Dispatch>,
530 534 filename: HgPathBuf,
531 535 dir_entry: DirEntry,
532 536 traversed_sender: crossbeam_channel::Sender<HgPathBuf>,
533 537 ) -> IoResult<()>
534 538 where
535 539 'a: 'b,
536 540 {
537 541 let file_type = dir_entry.file_type()?;
538 542 let entry_option = self.dmap.get(&filename);
539 543
540 544 if filename.as_bytes() == b".hg" {
541 545 // Could be a directory or a symlink
542 546 return Ok(());
543 547 }
544 548
545 549 if file_type.is_dir() {
546 550 self.handle_traversed_dir(
547 551 scope,
548 552 files_sender,
549 553 old_results,
550 554 entry_option,
551 555 filename,
552 556 traversed_sender,
553 557 );
554 558 } else if file_type.is_file() || file_type.is_symlink() {
555 559 if let Some(entry) = entry_option {
556 560 if self.matcher.matches_everything()
557 561 || self.matcher.matches(&filename)
558 562 {
559 563 let metadata = dir_entry.metadata()?;
560 564 files_sender
561 565 .send((
562 566 filename.to_owned(),
563 567 dispatch_found(
564 568 &filename,
565 569 *entry,
566 570 HgMetadata::from_metadata(metadata),
567 571 &self.dmap.copy_map,
568 572 self.options,
569 573 ),
570 574 ))
571 575 .unwrap();
572 576 }
573 577 } else if (self.matcher.matches_everything()
574 578 || self.matcher.matches(&filename))
575 579 && !self.is_ignored(&filename)
576 580 {
577 581 if (self.options.list_ignored
578 582 || self.matcher.exact_match(&filename))
579 583 && self.dir_ignore(&filename)
580 584 {
581 585 if self.options.list_ignored {
582 586 files_sender
583 587 .send((filename.to_owned(), Dispatch::Ignored))
584 588 .unwrap();
585 589 }
586 590 } else if self.options.list_unknown {
587 591 files_sender
588 592 .send((filename.to_owned(), Dispatch::Unknown))
589 593 .unwrap();
590 594 }
591 595 } else if self.is_ignored(&filename) && self.options.list_ignored {
592 596 if self.matcher.matches(&filename) {
593 597 files_sender
594 598 .send((filename.to_owned(), Dispatch::Ignored))
595 599 .unwrap();
596 600 }
597 601 }
598 602 } else if let Some(entry) = entry_option {
599 603 // Used to be a file or a folder, now something else.
600 604 if self.matcher.matches_everything()
601 605 || self.matcher.matches(&filename)
602 606 {
603 607 files_sender
604 608 .send((filename.to_owned(), dispatch_missing(entry.state)))
605 609 .unwrap();
606 610 }
607 611 }
608 612
609 613 Ok(())
610 614 }
611 615
612 616 /// A directory was found in the filesystem and needs to be traversed
613 617 fn handle_traversed_dir<'b>(
614 618 &'a self,
615 619 scope: &rayon::Scope<'b>,
616 620 files_sender: &'b crossbeam_channel::Sender<(HgPathBuf, Dispatch)>,
617 621 old_results: &'a FastHashMap<Cow<HgPath>, Dispatch>,
618 622 entry_option: Option<&'a DirstateEntry>,
619 623 directory: HgPathBuf,
620 624 traversed_sender: crossbeam_channel::Sender<HgPathBuf>,
621 625 ) where
622 626 'a: 'b,
623 627 {
624 628 scope.spawn(move |_| {
625 629 // Nested `if` until `rust-lang/rust#53668` is stable
626 630 if let Some(entry) = entry_option {
627 631 // Used to be a file, is now a folder
628 632 if self.matcher.matches_everything()
629 633 || self.matcher.matches(&directory)
630 634 {
631 635 files_sender
632 636 .send((
633 637 directory.to_owned(),
634 638 dispatch_missing(entry.state),
635 639 ))
636 640 .unwrap();
637 641 }
638 642 }
639 643 // Do we need to traverse it?
640 644 if !self.is_ignored(&directory) || self.options.list_ignored {
641 645 self.traverse_dir(
642 646 files_sender,
643 647 directory,
644 648 &old_results,
645 649 traversed_sender,
646 650 )
647 651 }
648 652 });
649 653 }
650 654
651 655 /// Decides whether the directory needs to be listed, and if so handles the
652 656 /// entries in a separate thread.
653 657 fn traverse_dir(
654 658 &self,
655 659 files_sender: &crossbeam_channel::Sender<(HgPathBuf, Dispatch)>,
656 660 directory: impl AsRef<HgPath>,
657 661 old_results: &FastHashMap<Cow<HgPath>, Dispatch>,
658 662 traversed_sender: crossbeam_channel::Sender<HgPathBuf>,
659 663 ) {
660 664 let directory = directory.as_ref();
661 665
662 666 if self.options.collect_traversed_dirs {
663 667 traversed_sender
664 668 .send(directory.to_owned())
665 669 .expect("receiver should outlive sender");
666 670 }
667 671
668 672 let visit_entries = match self.matcher.visit_children_set(directory) {
669 673 VisitChildrenSet::Empty => return,
670 674 VisitChildrenSet::This | VisitChildrenSet::Recursive => None,
671 675 VisitChildrenSet::Set(set) => Some(set),
672 676 };
673 677 let buf = match hg_path_to_path_buf(directory) {
674 678 Ok(b) => b,
675 679 Err(_) => {
676 680 files_sender
677 681 .send((directory.to_owned(), INVALID_PATH_DISPATCH))
678 682 .expect("receiver should outlive sender");
679 683 return;
680 684 }
681 685 };
682 686 let dir_path = self.root_dir.join(buf);
683 687
684 688 let skip_dot_hg = !directory.as_bytes().is_empty();
685 689 let entries = match list_directory(dir_path, skip_dot_hg) {
686 690 Err(e) => {
687 691 files_sender
688 692 .send((directory.to_owned(), dispatch_os_error(&e)))
689 693 .expect("receiver should outlive sender");
690 694 return;
691 695 }
692 696 Ok(entries) => entries,
693 697 };
694 698
695 699 rayon::scope(|scope| {
696 700 for (filename, dir_entry) in entries {
697 701 if let Some(ref set) = visit_entries {
698 702 if !set.contains(filename.deref()) {
699 703 continue;
700 704 }
701 705 }
702 706 // TODO normalize
703 707 let filename = if directory.is_empty() {
704 708 filename.to_owned()
705 709 } else {
706 710 directory.join(&filename)
707 711 };
708 712
709 713 if !old_results.contains_key(filename.deref()) {
710 714 match self.handle_traversed_entry(
711 715 scope,
712 716 files_sender,
713 717 old_results,
714 718 filename,
715 719 dir_entry,
716 720 traversed_sender.clone(),
717 721 ) {
718 722 Err(e) => {
719 723 files_sender
720 724 .send((
721 725 directory.to_owned(),
722 726 dispatch_os_error(&e),
723 727 ))
724 728 .expect("receiver should outlive sender");
725 729 }
726 730 Ok(_) => {}
727 731 }
728 732 }
729 733 }
730 734 })
731 735 }
732 736
733 737 /// Add the files in the dirstate to the results.
734 738 ///
735 739 /// This takes a mutable reference to the results to account for the
736 740 /// `extend` in timings
737 741 #[timed]
738 742 pub fn extend_from_dmap(&self, results: &mut Vec<DispatchedPath<'a>>) {
739 743 results.par_extend(
740 744 self.dmap
741 745 .par_iter()
742 746 .filter(|(path, _)| self.matcher.matches(path))
743 747 .map(move |(filename, entry)| {
744 748 let filename: &HgPath = filename;
745 749 let filename_as_path = match hg_path_to_path_buf(filename)
746 750 {
747 751 Ok(f) => f,
748 752 Err(_) => {
749 753 return (
750 754 Cow::Borrowed(filename),
751 755 INVALID_PATH_DISPATCH,
752 756 )
753 757 }
754 758 };
755 759 let meta = self
756 760 .root_dir
757 761 .join(filename_as_path)
758 762 .symlink_metadata();
759 763 match meta {
760 764 Ok(m)
761 765 if !(m.file_type().is_file()
762 766 || m.file_type().is_symlink()) =>
763 767 {
764 768 (
765 769 Cow::Borrowed(filename),
766 770 dispatch_missing(entry.state),
767 771 )
768 772 }
769 773 Ok(m) => (
770 774 Cow::Borrowed(filename),
771 775 dispatch_found(
772 776 filename,
773 777 *entry,
774 778 HgMetadata::from_metadata(m),
775 779 &self.dmap.copy_map,
776 780 self.options,
777 781 ),
778 782 ),
779 783 Err(e)
780 784 if e.kind() == ErrorKind::NotFound
781 785 || e.raw_os_error() == Some(20) =>
782 786 {
783 787 // Rust does not yet have an `ErrorKind` for
784 788 // `NotADirectory` (errno 20)
785 789 // It happens if the dirstate contains `foo/bar`
786 790 // and foo is not a
787 791 // directory
788 792 (
789 793 Cow::Borrowed(filename),
790 794 dispatch_missing(entry.state),
791 795 )
792 796 }
793 797 Err(e) => {
794 798 (Cow::Borrowed(filename), dispatch_os_error(&e))
795 799 }
796 800 }
797 801 }),
798 802 );
799 803 }
800 804
801 805 /// Checks all files that are in the dirstate but were not found during the
802 806 /// working directory traversal. This means that the rest must
803 807 /// be either ignored, under a symlink or under a new nested repo.
804 808 ///
805 809 /// This takes a mutable reference to the results to account for the
806 810 /// `extend` in timings
807 811 #[timed]
808 812 pub fn handle_unknowns(&self, results: &mut Vec<DispatchedPath<'a>>) {
809 813 let to_visit: Vec<(&HgPath, &DirstateEntry)> =
810 814 if results.is_empty() && self.matcher.matches_everything() {
811 815 self.dmap.iter().map(|(f, e)| (f.deref(), e)).collect()
812 816 } else {
813 817 // Only convert to a hashmap if needed.
814 818 let old_results: FastHashMap<_, _> =
815 819 results.iter().cloned().collect();
816 820 self.dmap
817 821 .iter()
818 822 .filter_map(move |(f, e)| {
819 823 if !old_results.contains_key(f.deref())
820 824 && self.matcher.matches(f)
821 825 {
822 826 Some((f.deref(), e))
823 827 } else {
824 828 None
825 829 }
826 830 })
827 831 .collect()
828 832 };
829 833
830 834 let path_auditor = PathAuditor::new(&self.root_dir);
831 835
832 836 let new_results = to_visit.into_par_iter().filter_map(
833 837 |(filename, entry)| -> Option<_> {
834 838 // Report ignored items in the dmap as long as they are not
835 839 // under a symlink directory.
836 840 if path_auditor.check(filename) {
837 841 // TODO normalize for case-insensitive filesystems
838 842 let buf = match hg_path_to_path_buf(filename) {
839 843 Ok(x) => x,
840 844 Err(_) => {
841 845 return Some((
842 846 Cow::Owned(filename.to_owned()),
843 847 INVALID_PATH_DISPATCH,
844 848 ));
845 849 }
846 850 };
847 851 Some((
848 852 Cow::Owned(filename.to_owned()),
849 853 match self.root_dir.join(&buf).symlink_metadata() {
850 854 // File was just ignored, no links, and exists
851 855 Ok(meta) => {
852 856 let metadata = HgMetadata::from_metadata(meta);
853 857 dispatch_found(
854 858 filename,
855 859 *entry,
856 860 metadata,
857 861 &self.dmap.copy_map,
858 862 self.options,
859 863 )
860 864 }
861 865 // File doesn't exist
862 866 Err(_) => dispatch_missing(entry.state),
863 867 },
864 868 ))
865 869 } else {
866 870 // It's either missing or under a symlink directory which
867 871 // we, in this case, report as missing.
868 872 Some((
869 873 Cow::Owned(filename.to_owned()),
870 874 dispatch_missing(entry.state),
871 875 ))
872 876 }
873 877 },
874 878 );
875 879
876 880 results.par_extend(new_results);
877 881 }
878 882 }
879 883
880 884 #[timed]
881 885 pub fn build_response<'a>(
882 886 results: impl IntoIterator<Item = DispatchedPath<'a>>,
883 887 traversed: Vec<HgPathCow<'a>>,
884 888 ) -> DirstateStatus<'a> {
885 889 let mut unsure = vec![];
886 890 let mut modified = vec![];
887 891 let mut added = vec![];
888 892 let mut removed = vec![];
889 893 let mut deleted = vec![];
890 894 let mut clean = vec![];
891 895 let mut ignored = vec![];
892 896 let mut unknown = vec![];
893 897 let mut bad = vec![];
894 898
895 899 for (filename, dispatch) in results.into_iter() {
896 900 match dispatch {
897 901 Dispatch::Unknown => unknown.push(filename),
898 902 Dispatch::Unsure => unsure.push(filename),
899 903 Dispatch::Modified => modified.push(filename),
900 904 Dispatch::Added => added.push(filename),
901 905 Dispatch::Removed => removed.push(filename),
902 906 Dispatch::Deleted => deleted.push(filename),
903 907 Dispatch::Clean => clean.push(filename),
904 908 Dispatch::Ignored => ignored.push(filename),
905 909 Dispatch::None => {}
906 910 Dispatch::Bad(reason) => bad.push((filename, reason)),
907 911 Dispatch::Directory { .. } => {}
908 912 }
909 913 }
910 914
911 915 DirstateStatus {
912 916 modified,
913 917 added,
914 918 removed,
915 919 deleted,
916 920 clean,
917 921 ignored,
918 922 unknown,
919 923 bad,
920 924 unsure,
921 925 traversed,
926 dirty: false,
922 927 }
923 928 }
924 929
925 930 /// Get the status of files in the working directory.
926 931 ///
927 932 /// This is the current entry-point for `hg-core` and is realistically unusable
928 933 /// outside of a Python context because its arguments need to provide a lot of
929 934 /// information that will not be necessary in the future.
930 935 #[timed]
931 936 pub fn status<'a>(
932 937 dmap: &'a DirstateMap,
933 938 matcher: &'a (dyn Matcher + Sync),
934 939 root_dir: PathBuf,
935 940 ignore_files: Vec<PathBuf>,
936 941 options: StatusOptions,
937 942 ) -> StatusResult<(DirstateStatus<'a>, Vec<PatternFileWarning>)> {
938 943 let (status, warnings) =
939 944 Status::new(dmap, matcher, root_dir, ignore_files, options)?;
940 945
941 946 Ok((status.run()?, warnings))
942 947 }
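
A minimal sketch of driving this entry point; the repository paths are illustrative, and `AlwaysMatcher` is hg-core's match-everything matcher:

    use hg::matchers::AlwaysMatcher;
    use std::path::PathBuf;

    fn demo(dmap: &DirstateMap, options: StatusOptions) -> StatusResult<()> {
        let (outcome, _pattern_warnings) = status(
            dmap,
            &AlwaysMatcher,
            PathBuf::from("/path/to/repo"), // working directory root
            vec![PathBuf::from("/path/to/repo/.hgignore")],
            options,
        )?;
        println!(
            "modified: {}, unsure: {}, unknown: {}",
            outcome.modified.len(),
            outcome.unsure.len(),
            outcome.unknown.len()
        );
        Ok(())
    }
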
@@ -1,684 +1,685 b''
1 1 use crate::dirstate::status::IgnoreFnType;
2 2 use crate::dirstate_tree::dirstate_map::BorrowedPath;
3 3 use crate::dirstate_tree::dirstate_map::ChildNodesRef;
4 4 use crate::dirstate_tree::dirstate_map::DirstateMap;
5 5 use crate::dirstate_tree::dirstate_map::NodeData;
6 6 use crate::dirstate_tree::dirstate_map::NodeRef;
7 7 use crate::dirstate_tree::on_disk::DirstateV2ParseError;
8 8 use crate::dirstate_tree::on_disk::Timestamp;
9 9 use crate::dirstate_tree::path_with_basename::WithBasename;
10 10 use crate::matchers::get_ignore_function;
11 11 use crate::matchers::Matcher;
12 12 use crate::utils::files::get_bytes_from_os_string;
13 13 use crate::utils::files::get_path_from_bytes;
14 14 use crate::utils::hg_path::HgPath;
15 15 use crate::BadMatch;
16 16 use crate::DirstateStatus;
17 17 use crate::EntryState;
18 18 use crate::HgPathBuf;
19 19 use crate::PatternFileWarning;
20 20 use crate::StatusError;
21 21 use crate::StatusOptions;
22 22 use micro_timer::timed;
23 23 use rayon::prelude::*;
24 24 use std::borrow::Cow;
25 25 use std::io;
26 26 use std::path::Path;
27 27 use std::path::PathBuf;
28 28 use std::sync::Mutex;
29 29 use std::time::SystemTime;
30 30
31 31 /// Returns the status of the working directory compared to its parent
32 32 /// changeset.
33 33 ///
34 34 /// This algorithm is based on traversing the filesystem tree (`fs` in function
35 35 /// and variable names) and dirstate tree at the same time. The core of this
36 36 /// traversal is the recursive `traverse_fs_directory_and_dirstate` function
37 37 /// and its use of `itertools::merge_join_by`. When reaching a path that only
38 38 /// exists in one of the two trees, depending on information requested by
39 39 /// `options` we may need to traverse the remaining subtree.
40 40 #[timed]
41 41 pub fn status<'tree, 'on_disk: 'tree>(
42 42 dmap: &'tree mut DirstateMap<'on_disk>,
43 43 matcher: &(dyn Matcher + Sync),
44 44 root_dir: PathBuf,
45 45 ignore_files: Vec<PathBuf>,
46 46 options: StatusOptions,
47 47 ) -> Result<(DirstateStatus<'on_disk>, Vec<PatternFileWarning>), StatusError> {
48 48 let (ignore_fn, warnings): (IgnoreFnType, _) =
49 49 if options.list_ignored || options.list_unknown {
50 50 get_ignore_function(ignore_files, &root_dir)?
51 51 } else {
52 52 (Box::new(|&_| true), vec![])
53 53 };
54 54
55 55 let common = StatusCommon {
56 56 dmap,
57 57 options,
58 58 matcher,
59 59 ignore_fn,
60 60 outcome: Default::default(),
61 61 cached_directory_mtimes_to_add: Default::default(),
62 62 filesystem_time_at_status_start: filesystem_now(&root_dir).ok(),
63 63 };
64 64 let is_at_repo_root = true;
65 65 let hg_path = &BorrowedPath::OnDisk(HgPath::new(""));
66 66 let has_ignored_ancestor = false;
67 67 let root_cached_mtime = None;
68 68 let root_dir_metadata = None;
69 69 // If the path we have for the repository root is a symlink, do follow it.
70 70 // (As opposed to symlinks within the working directory which are not
71 71 // followed, using `std::fs::symlink_metadata`.)
72 72 common.traverse_fs_directory_and_dirstate(
73 73 has_ignored_ancestor,
74 74 dmap.root.as_ref(),
75 75 hg_path,
76 76 &root_dir,
77 77 root_dir_metadata,
78 78 root_cached_mtime,
79 79 is_at_repo_root,
80 80 )?;
81 let outcome = common.outcome.into_inner().unwrap();
81 let mut outcome = common.outcome.into_inner().unwrap();
82 82 let to_add = common.cached_directory_mtimes_to_add.into_inner().unwrap();
83 outcome.dirty = !to_add.is_empty();
83 84 for (path, mtime) in &to_add {
84 85 let node = DirstateMap::get_or_insert_node(
85 86 dmap.on_disk,
86 87 &mut dmap.root,
87 88 path,
88 89 WithBasename::to_cow_owned,
89 90 |_| {},
90 91 )?;
91 92 match &node.data {
92 93 NodeData::Entry(_) => {} // Don’t overwrite an entry
93 94 NodeData::CachedDirectory { .. } | NodeData::None => {
94 95 node.data = NodeData::CachedDirectory { mtime: *mtime }
95 96 }
96 97 }
97 98 }
98 99 Ok((outcome, warnings))
99 100 }
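
The cache-insertion rule above never clobbers a real entry. A self-contained sketch of the same rule (this enum only mirrors `NodeData` in shape; `Timestamp` is simplified to an integer here):

    #[derive(Debug)]
    enum NodeData {
        Entry(&'static str),            // a real dirstate entry: never overwritten
        CachedDirectory { mtime: u64 }, // a cached read_dir mtime: refreshable
        None,                           // a bare "directory" node: upgradable
    }

    fn cache_mtime(data: &mut NodeData, mtime: u64) {
        match data {
            NodeData::Entry(_) => {} // don't overwrite an entry
            NodeData::CachedDirectory { .. } | NodeData::None => {
                *data = NodeData::CachedDirectory { mtime }
            }
        }
    }

    fn main() {
        let mut file = NodeData::Entry("tracked file");
        let mut dir = NodeData::None;
        cache_mtime(&mut file, 42);
        cache_mtime(&mut dir, 42);
        println!("{:?} / {:?}", file, dir); // Entry("tracked file") / CachedDirectory { mtime: 42 }
    }
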
100 101
101 102 /// Bag of random things needed by various parts of the algorithm. Reduces the
102 103 /// number of parameters passed to functions.
103 104 struct StatusCommon<'a, 'tree, 'on_disk: 'tree> {
104 105 dmap: &'tree DirstateMap<'on_disk>,
105 106 options: StatusOptions,
106 107 matcher: &'a (dyn Matcher + Sync),
107 108 ignore_fn: IgnoreFnType<'a>,
108 109 outcome: Mutex<DirstateStatus<'on_disk>>,
109 110 cached_directory_mtimes_to_add:
110 111 Mutex<Vec<(Cow<'on_disk, HgPath>, Timestamp)>>,
111 112
112 113 /// The current time at the start of the `status()` algorithm, as measured
113 114 /// and possibly truncated by the filesystem.
114 115 filesystem_time_at_status_start: Option<SystemTime>,
115 116 }
116 117
117 118 impl<'a, 'tree, 'on_disk> StatusCommon<'a, 'tree, 'on_disk> {
118 119 fn read_dir(
119 120 &self,
120 121 hg_path: &HgPath,
121 122 fs_path: &Path,
122 123 is_at_repo_root: bool,
123 124 ) -> Result<Vec<DirEntry>, ()> {
124 125 DirEntry::read_dir(fs_path, is_at_repo_root)
125 126 .map_err(|error| self.io_error(error, hg_path))
126 127 }
127 128
128 129 fn io_error(&self, error: std::io::Error, hg_path: &HgPath) {
129 130 let errno = error.raw_os_error().expect("expected real OS error");
130 131 self.outcome
131 132 .lock()
132 133 .unwrap()
133 134 .bad
134 135 .push((hg_path.to_owned().into(), BadMatch::OsError(errno)))
135 136 }
136 137
137 138 /// If this returns true, we can get accurate results by only using
138 139 /// `symlink_metadata` for child nodes that exist in the dirstate,
139 140 /// without needing to call `read_dir`.
140 141 fn can_skip_fs_readdir(
141 142 &self,
142 143 directory_metadata: Option<&std::fs::Metadata>,
143 144 cached_directory_mtime: Option<&Timestamp>,
144 145 ) -> bool {
145 146 if !self.options.list_unknown && !self.options.list_ignored {
146 147 // All states that we care about listing have corresponding
147 148 // dirstate entries.
148 149 // This happens for example with `hg status -mard`.
149 150 return true;
150 151 }
151 152 if let Some(cached_mtime) = cached_directory_mtime {
152 153 // The dirstate contains a cached mtime for this directory, set by
153 154 // a previous run of the `status` algorithm which found this
154 155 // directory eligible for `read_dir` caching.
155 156 if let Some(meta) = directory_metadata {
156 157 if let Ok(current_mtime) = meta.modified() {
157 158 if current_mtime == cached_mtime.into() {
158 159 // The mtime of that directory has not changed since
159 160 // then, which means that the
160 161 // results of `read_dir` should also
161 162 // be unchanged.
162 163 return true;
163 164 }
164 165 }
165 166 }
166 167 }
167 168 false
168 169 }
169 170
170 171 /// Returns whether the filesystem directory was found to have any entry
171 172 /// that does not have a corresponding dirstate tree node.
172 173 fn traverse_fs_directory_and_dirstate(
173 174 &self,
174 175 has_ignored_ancestor: bool,
175 176 dirstate_nodes: ChildNodesRef<'tree, 'on_disk>,
176 177 directory_hg_path: &BorrowedPath<'tree, 'on_disk>,
177 178 directory_fs_path: &Path,
178 179 directory_metadata: Option<&std::fs::Metadata>,
179 180 cached_directory_mtime: Option<&Timestamp>,
180 181 is_at_repo_root: bool,
181 182 ) -> Result<bool, DirstateV2ParseError> {
182 183 if self.can_skip_fs_readdir(directory_metadata, cached_directory_mtime)
183 184 {
184 185 dirstate_nodes
185 186 .par_iter()
186 187 .map(|dirstate_node| {
187 188 let fs_path = directory_fs_path.join(get_path_from_bytes(
188 189 dirstate_node.base_name(self.dmap.on_disk)?.as_bytes(),
189 190 ));
190 191 match std::fs::symlink_metadata(&fs_path) {
191 192 Ok(fs_metadata) => self.traverse_fs_and_dirstate(
192 193 &fs_path,
193 194 &fs_metadata,
194 195 dirstate_node,
195 196 has_ignored_ancestor,
196 197 ),
197 198 Err(e) if e.kind() == std::io::ErrorKind::NotFound => {
198 199 self.traverse_dirstate_only(dirstate_node)
199 200 }
200 201 Err(error) => {
201 202 let hg_path =
202 203 dirstate_node.full_path(self.dmap.on_disk)?;
203 204 Ok(self.io_error(error, hg_path))
204 205 }
205 206 }
206 207 })
207 208 .collect::<Result<_, _>>()?;
208 209
209 210 // Conservatively don’t let the caller assume that there aren’t
210 211 // any, since we don’t know.
211 212 let directory_has_any_fs_only_entry = true;
212 213
213 214 return Ok(directory_has_any_fs_only_entry);
214 215 }
215 216
216 217 let mut fs_entries = if let Ok(entries) = self.read_dir(
217 218 directory_hg_path,
218 219 directory_fs_path,
219 220 is_at_repo_root,
220 221 ) {
221 222 entries
222 223 } else {
223 224 // Treat an unreadable directory (typically because of insufficient
224 225 // permissions) like an empty directory. `self.read_dir` has
225 226 // already called `self.io_error` so a warning will be emitted.
226 227 Vec::new()
227 228 };
228 229
229 230 // `merge_join_by` requires both its input iterators to be sorted:
230 231
231 232 let dirstate_nodes = dirstate_nodes.sorted();
232 233 // `sort_unstable_by_key` doesn’t allow keys borrowing from the value:
233 234 // https://github.com/rust-lang/rust/issues/34162
234 235 fs_entries.sort_unstable_by(|e1, e2| e1.base_name.cmp(&e2.base_name));
235 236
236 237 // Propagate here any error that would happen inside the comparison
237 238 // callback below
238 239 for dirstate_node in &dirstate_nodes {
239 240 dirstate_node.base_name(self.dmap.on_disk)?;
240 241 }
241 242 itertools::merge_join_by(
242 243 dirstate_nodes,
243 244 &fs_entries,
244 245 |dirstate_node, fs_entry| {
245 246 // This `unwrap` never panics because we already propagated
246 247 // those errors above
247 248 dirstate_node
248 249 .base_name(self.dmap.on_disk)
249 250 .unwrap()
250 251 .cmp(&fs_entry.base_name)
251 252 },
252 253 )
253 254 .par_bridge()
254 255 .map(|pair| {
255 256 use itertools::EitherOrBoth::*;
256 257 let is_fs_only = pair.is_right();
257 258 match pair {
258 259 Both(dirstate_node, fs_entry) => self
259 260 .traverse_fs_and_dirstate(
260 261 &fs_entry.full_path,
261 262 &fs_entry.metadata,
262 263 dirstate_node,
263 264 has_ignored_ancestor,
264 265 )?,
265 266 Left(dirstate_node) => {
266 267 self.traverse_dirstate_only(dirstate_node)?
267 268 }
268 269 Right(fs_entry) => self.traverse_fs_only(
269 270 has_ignored_ancestor,
270 271 directory_hg_path,
271 272 fs_entry,
272 273 ),
273 274 }
274 275 Ok(is_fs_only)
275 276 })
276 277 .try_reduce(|| false, |a, b| Ok(a || b))
277 278 }
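
A standalone sketch of the `merge_join_by` pattern used above: two sorted name sequences are merged, and each output tells us which side(s) a name came from, mirroring the both / dirstate-only / fs-only dispatch (file names here are invented):

    use itertools::EitherOrBoth::{Both, Left, Right};

    fn main() {
        let dirstate = ["a.txt", "b.txt", "d.txt"]; // sorted dirstate children
        let fs = ["b.txt", "c.txt", "d.txt"]; // sorted read_dir results
        for pair in itertools::merge_join_by(dirstate, fs, |d, f| d.cmp(f)) {
            match pair {
                Both(name, _) => println!("{}: in dirstate and on disk", name),
                Left(name) => println!("{}: dirstate-only (removed or deleted)", name),
                Right(name) => println!("{}: fs-only (unknown or ignored)", name),
            }
        }
    }
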
278 279
279 280 fn traverse_fs_and_dirstate(
280 281 &self,
281 282 fs_path: &Path,
282 283 fs_metadata: &std::fs::Metadata,
283 284 dirstate_node: NodeRef<'tree, 'on_disk>,
284 285 has_ignored_ancestor: bool,
285 286 ) -> Result<(), DirstateV2ParseError> {
286 287 let hg_path = &dirstate_node.full_path_borrowed(self.dmap.on_disk)?;
287 288 let file_type = fs_metadata.file_type();
288 289 let file_or_symlink = file_type.is_file() || file_type.is_symlink();
289 290 if !file_or_symlink {
290 291 // If we previously had a file here, it was removed (with
291 292 // `hg rm` or similar) or deleted before it could be
292 293 // replaced by a directory or something else.
293 294 self.mark_removed_or_deleted_if_file(
294 295 &hg_path,
295 296 dirstate_node.state()?,
296 297 );
297 298 }
298 299 if file_type.is_dir() {
299 300 if self.options.collect_traversed_dirs {
300 301 self.outcome
301 302 .lock()
302 303 .unwrap()
303 304 .traversed
304 305 .push(hg_path.detach_from_tree())
305 306 }
306 307 let is_ignored = has_ignored_ancestor || (self.ignore_fn)(hg_path);
307 308 let is_at_repo_root = false;
308 309 let directory_has_any_fs_only_entry = self
309 310 .traverse_fs_directory_and_dirstate(
310 311 is_ignored,
311 312 dirstate_node.children(self.dmap.on_disk)?,
312 313 hg_path,
313 314 fs_path,
314 315 Some(fs_metadata),
315 316 dirstate_node.cached_directory_mtime(),
316 317 is_at_repo_root,
317 318 )?;
318 319 self.maybe_save_directory_mtime(
319 320 directory_has_any_fs_only_entry,
320 321 fs_metadata,
321 322 dirstate_node,
322 323 )?
323 324 } else {
324 325 if file_or_symlink && self.matcher.matches(hg_path) {
325 326 if let Some(state) = dirstate_node.state()? {
326 327 match state {
327 328 EntryState::Added => self
328 329 .outcome
329 330 .lock()
330 331 .unwrap()
331 332 .added
332 333 .push(hg_path.detach_from_tree()),
333 334 EntryState::Removed => self
334 335 .outcome
335 336 .lock()
336 337 .unwrap()
337 338 .removed
338 339 .push(hg_path.detach_from_tree()),
339 340 EntryState::Merged => self
340 341 .outcome
341 342 .lock()
342 343 .unwrap()
343 344 .modified
344 345 .push(hg_path.detach_from_tree()),
345 346 EntryState::Normal => self
346 347 .handle_normal_file(&dirstate_node, fs_metadata)?,
347 348 // This variant is not used in DirstateMap
348 349 // nodes
349 350 EntryState::Unknown => unreachable!(),
350 351 }
351 352 } else {
352 353 // `node.entry.is_none()` indicates a "directory"
353 354 // node, but the filesystem has a file
354 355 self.mark_unknown_or_ignored(has_ignored_ancestor, hg_path)
355 356 }
356 357 }
357 358
358 359 for child_node in dirstate_node.children(self.dmap.on_disk)?.iter()
359 360 {
360 361 self.traverse_dirstate_only(child_node)?
361 362 }
362 363 }
363 364 Ok(())
364 365 }
365 366
366 367 fn maybe_save_directory_mtime(
367 368 &self,
368 369 directory_has_any_fs_only_entry: bool,
369 370 directory_metadata: &std::fs::Metadata,
370 371 dirstate_node: NodeRef<'tree, 'on_disk>,
371 372 ) -> Result<(), DirstateV2ParseError> {
372 373 if !directory_has_any_fs_only_entry {
373 374 // All filesystem directory entries from `read_dir` have a
374 375 // corresponding node in the dirstate, so we can reconstitute the
375 376 // names of those entries without calling `read_dir` again.
376 377 if let (Some(status_start), Ok(directory_mtime)) = (
377 378 &self.filesystem_time_at_status_start,
378 379 directory_metadata.modified(),
379 380 ) {
380 381 // Although the Rust standard library’s `SystemTime` type
381 382 // has nanosecond precision, the times reported for a
382 383 // directory’s (or file’s) modified time may have lower
383 384 // resolution based on the filesystem (for example ext3
384 385 // only stores integer seconds), kernel (see
385 386 // https://stackoverflow.com/a/14393315/1162888), etc.
386 387 if &directory_mtime >= status_start {
387 388 // The directory was modified too recently, don’t cache its
388 389 // `read_dir` results.
389 390 //
390 391 // A timeline like this is possible:
391 392 //
392 393 // 1. A change to this directory (direct child was
393 394 // added or removed) causes its mtime to be set
394 395 // (possibly truncated) to `directory_mtime`
395 396 // 2. This `status` algorithm calls `read_dir`
396 397 // 3. Another change is made to the same directory so
397 398 // that calling `read_dir` again would give
398 399 // different results, but soon enough after 1. that
399 400 // the mtime stays the same
400 401 //
401 402 // On a system where the time resolution is poor, this
402 403 // scenario is not unlikely if all three steps are caused
403 404 // by the same script.
404 405 } else {
405 406 // We’ve observed (through `status_start`) that time has
406 407 // “progressed” since `directory_mtime`, so any further
407 408 // change to this directory is extremely likely to cause a
408 409 // different mtime.
409 410 //
410 411 // Having the same mtime again is not entirely impossible
411 412 // since the system clock is not monotonic. It could jump
412 413 // backward to some point before `directory_mtime`, then a
413 414 // directory change could potentially happen during exactly
414 415 // the wrong tick.
415 416 //
416 417 // We deem this scenario (unlike the previous one) to be
417 418 // unlikely enough in practice.
418 419 let timestamp = directory_mtime.into();
419 420 let cached = dirstate_node.cached_directory_mtime();
420 421 if cached != Some(&timestamp) {
421 422 let hg_path = dirstate_node
422 423 .full_path_borrowed(self.dmap.on_disk)?
423 424 .detach_from_tree();
424 425 self.cached_directory_mtimes_to_add
425 426 .lock()
426 427 .unwrap()
427 428 .push((hg_path, timestamp))
428 429 }
429 430 }
430 431 }
431 432 }
432 433 Ok(())
433 434 }
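
A sketch of the guard above with hypothetical values: an mtime at or after the time observed at the start of `status()` must not be cached, because the directory could still change within the same timestamp tick:

    use std::time::{Duration, SystemTime};

    fn may_cache(directory_mtime: SystemTime, status_start: SystemTime) -> bool {
        directory_mtime < status_start
    }

    fn main() {
        let start = SystemTime::now();
        let older = start - Duration::from_secs(2);
        assert!(may_cache(older, start)); // time has progressed: safe to cache
        assert!(!may_cache(start, start)); // same tick: skip caching
    }
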
434 435
435 436 /// A file with `EntryState::Normal` in the dirstate was found in the
436 437 /// filesystem
437 438 fn handle_normal_file(
438 439 &self,
439 440 dirstate_node: &NodeRef<'tree, 'on_disk>,
440 441 fs_metadata: &std::fs::Metadata,
441 442 ) -> Result<(), DirstateV2ParseError> {
442 443 // Keep the low 31 bits
443 444 fn truncate_u64(value: u64) -> i32 {
444 445 (value & 0x7FFF_FFFF) as i32
445 446 }
446 447 fn truncate_i64(value: i64) -> i32 {
447 448 (value & 0x7FFF_FFFF) as i32
448 449 }
449 450
450 451 let entry = dirstate_node
451 452 .entry()?
452 453 .expect("handle_normal_file called with entry-less node");
453 454 let hg_path = &dirstate_node.full_path_borrowed(self.dmap.on_disk)?;
454 455 let mode_changed =
455 456 || self.options.check_exec && entry.mode_changed(fs_metadata);
456 457 let size_changed = entry.size != truncate_u64(fs_metadata.len());
457 458 if entry.size >= 0
458 459 && size_changed
459 460 && fs_metadata.file_type().is_symlink()
460 461 {
461 462 // issue6456: Size returned may be longer due to encryption
462 463 // on EXT-4 fscrypt. TODO maybe only do it on EXT4?
463 464 self.outcome
464 465 .lock()
465 466 .unwrap()
466 467 .unsure
467 468 .push(hg_path.detach_from_tree())
468 469 } else if dirstate_node.has_copy_source()
469 470 || entry.is_from_other_parent()
470 471 || (entry.size >= 0 && (size_changed || mode_changed()))
471 472 {
472 473 self.outcome
473 474 .lock()
474 475 .unwrap()
475 476 .modified
476 477 .push(hg_path.detach_from_tree())
477 478 } else {
478 479 let mtime = mtime_seconds(fs_metadata);
479 480 if truncate_i64(mtime) != entry.mtime
480 481 || mtime == self.options.last_normal_time
481 482 {
482 483 self.outcome
483 484 .lock()
484 485 .unwrap()
485 486 .unsure
486 487 .push(hg_path.detach_from_tree())
487 488 } else if self.options.list_clean {
488 489 self.outcome
489 490 .lock()
490 491 .unwrap()
491 492 .clean
492 493 .push(hg_path.detach_from_tree())
493 494 }
494 495 }
495 496 Ok(())
496 497 }
497 498
498 499 /// A node in the dirstate tree has no corresponding filesystem entry
499 500 fn traverse_dirstate_only(
500 501 &self,
501 502 dirstate_node: NodeRef<'tree, 'on_disk>,
502 503 ) -> Result<(), DirstateV2ParseError> {
503 504 self.mark_removed_or_deleted_if_file(
504 505 &dirstate_node.full_path_borrowed(self.dmap.on_disk)?,
505 506 dirstate_node.state()?,
506 507 );
507 508 dirstate_node
508 509 .children(self.dmap.on_disk)?
509 510 .par_iter()
510 511 .map(|child_node| self.traverse_dirstate_only(child_node))
511 512 .collect()
512 513 }
513 514
514 515 /// A node in the dirstate tree has no corresponding *file* on the
515 516 /// filesystem
516 517 ///
517 518 /// Does nothing on a "directory" node
518 519 fn mark_removed_or_deleted_if_file(
519 520 &self,
520 521 hg_path: &BorrowedPath<'tree, 'on_disk>,
521 522 dirstate_node_state: Option<EntryState>,
522 523 ) {
523 524 if let Some(state) = dirstate_node_state {
524 525 if self.matcher.matches(hg_path) {
525 526 if let EntryState::Removed = state {
526 527 self.outcome
527 528 .lock()
528 529 .unwrap()
529 530 .removed
530 531 .push(hg_path.detach_from_tree())
531 532 } else {
532 533 self.outcome
533 534 .lock()
534 535 .unwrap()
535 536 .deleted
536 537 .push(hg_path.detach_from_tree())
537 538 }
538 539 }
539 540 }
540 541 }
541 542
542 543 /// Something in the filesystem has no corresponding dirstate node
543 544 fn traverse_fs_only(
544 545 &self,
545 546 has_ignored_ancestor: bool,
546 547 directory_hg_path: &HgPath,
547 548 fs_entry: &DirEntry,
548 549 ) {
549 550 let hg_path = directory_hg_path.join(&fs_entry.base_name);
550 551 let file_type = fs_entry.metadata.file_type();
551 552 let file_or_symlink = file_type.is_file() || file_type.is_symlink();
552 553 if file_type.is_dir() {
553 554 let is_ignored =
554 555 has_ignored_ancestor || (self.ignore_fn)(&hg_path);
555 556 let traverse_children = if is_ignored {
556 557 // Descendants of an ignored directory are all ignored
557 558 self.options.list_ignored
558 559 } else {
559 560 // Descendants of an unknown directory may be either unknown or
560 561 // ignored
561 562 self.options.list_unknown || self.options.list_ignored
562 563 };
563 564 if traverse_children {
564 565 let is_at_repo_root = false;
565 566 if let Ok(children_fs_entries) = self.read_dir(
566 567 &hg_path,
567 568 &fs_entry.full_path,
568 569 is_at_repo_root,
569 570 ) {
570 571 children_fs_entries.par_iter().for_each(|child_fs_entry| {
571 572 self.traverse_fs_only(
572 573 is_ignored,
573 574 &hg_path,
574 575 child_fs_entry,
575 576 )
576 577 })
577 578 }
578 579 }
579 580 if self.options.collect_traversed_dirs {
580 581 self.outcome.lock().unwrap().traversed.push(hg_path.into())
581 582 }
582 583 } else if file_or_symlink && self.matcher.matches(&hg_path) {
583 584 self.mark_unknown_or_ignored(
584 585 has_ignored_ancestor,
585 586 &BorrowedPath::InMemory(&hg_path),
586 587 )
587 588 }
588 589 }
589 590
590 591 fn mark_unknown_or_ignored(
591 592 &self,
592 593 has_ignored_ancestor: bool,
593 594 hg_path: &BorrowedPath<'_, 'on_disk>,
594 595 ) {
595 596 let is_ignored = has_ignored_ancestor || (self.ignore_fn)(&hg_path);
596 597 if is_ignored {
597 598 if self.options.list_ignored {
598 599 self.outcome
599 600 .lock()
600 601 .unwrap()
601 602 .ignored
602 603 .push(hg_path.detach_from_tree())
603 604 }
604 605 } else {
605 606 if self.options.list_unknown {
606 607 self.outcome
607 608 .lock()
608 609 .unwrap()
609 610 .unknown
610 611 .push(hg_path.detach_from_tree())
611 612 }
612 613 }
613 614 }
614 615 }
615 616
616 617 #[cfg(unix)] // TODO
617 618 fn mtime_seconds(metadata: &std::fs::Metadata) -> i64 {
618 619 // Going through `Metadata::modified()` would be portable, but would take
619 620 // care to construct a `SystemTime` value with sub-second precision just
620 621 // for us to throw that away here.
621 622 use std::os::unix::fs::MetadataExt;
622 623 metadata.mtime()
623 624 }
624 625
625 626 struct DirEntry {
626 627 base_name: HgPathBuf,
627 628 full_path: PathBuf,
628 629 metadata: std::fs::Metadata,
629 630 }
630 631
631 632 impl DirEntry {
632 633 /// Returns **unsorted** entries in the given directory, with name and
633 634 /// metadata.
634 635 ///
635 636 /// If a `.hg` sub-directory is encountered:
636 637 ///
637 638 /// * At the repository root, ignore that sub-directory
638 639 /// * Elsewhere, we’re listing the content of a sub-repo. Return an empty
639 640 /// list instead.
640 641 fn read_dir(path: &Path, is_at_repo_root: bool) -> io::Result<Vec<Self>> {
641 642 let mut results = Vec::new();
642 643 for entry in path.read_dir()? {
643 644 let entry = entry?;
644 645 let metadata = entry.metadata()?;
645 646 let name = get_bytes_from_os_string(entry.file_name());
646 647 // FIXME don't do this when cached
647 648 if name == b".hg" {
648 649 if is_at_repo_root {
649 650 // Skip the repo’s own .hg (might be a symlink)
650 651 continue;
651 652 } else if metadata.is_dir() {
652 653 // A .hg sub-directory at another location means a subrepo,
653 654 // skip it entirely.
654 655 return Ok(Vec::new());
655 656 }
656 657 }
657 658 results.push(DirEntry {
658 659 base_name: name.into(),
659 660 full_path: entry.path(),
660 661 metadata,
661 662 })
662 663 }
663 664 Ok(results)
664 665 }
665 666 }
666 667
667 668 /// Return the `mtime` of a temporary file newly-created in the `.hg` directory
668 669 /// of the given repository.
669 670 ///
670 671 /// This is similar to `SystemTime::now()`, with the result truncated to the
671 672 /// same time resolution as other files’ modification times. Using `.hg`
672 673 /// instead of the system’s default temporary directory (such as `/tmp`) makes
673 674 /// it more likely the temporary file is in the same disk partition as contents
674 675 /// of the working directory, which can matter since different filesystems may
675 676 /// store timestamps with different resolutions.
676 677 ///
677 678 /// This may fail, typically if we lack write permissions. In that case we
678 679 /// should continue the `status()` algorithm anyway and consider the current
679 680 /// date/time to be unknown.
680 681 fn filesystem_now(repo_root: &Path) -> Result<SystemTime, io::Error> {
681 682 tempfile::tempfile_in(repo_root.join(".hg"))?
682 683 .metadata()?
683 684 .modified()
684 685 }
@@ -1,302 +1,304 b''
1 1 // status.rs
2 2 //
3 3 // Copyright 2019, Raphaël Gomès <rgomes@octobus.net>
4 4 //
5 5 // This software may be used and distributed according to the terms of the
6 6 // GNU General Public License version 2 or any later version.
7 7
8 8 //! Bindings for the `hg::status` module provided by the
9 9 //! `hg-core` crate. From Python, this will be seen as
10 10 //! `rustext.dirstate.status`.
11 11
12 12 use crate::{dirstate::DirstateMap, exceptions::FallbackError};
13 13 use cpython::exc::OSError;
14 14 use cpython::{
15 15 exc::ValueError, ObjectProtocol, PyBytes, PyErr, PyList, PyObject,
16 16 PyResult, PyTuple, Python, PythonObject, ToPyObject,
17 17 };
18 18 use hg::{
19 19 matchers::{AlwaysMatcher, FileMatcher, IncludeMatcher},
20 20 parse_pattern_syntax,
21 21 utils::{
22 22 files::{get_bytes_from_path, get_path_from_bytes},
23 23 hg_path::{HgPath, HgPathBuf},
24 24 },
25 25 BadMatch, DirstateStatus, IgnorePattern, PatternFileWarning, StatusError,
26 26 StatusOptions,
27 27 };
28 28 use std::borrow::Borrow;
29 29
30 30 /// This will be useless once trait impls for collections are added to
31 31 /// `PyBytes` upstream.
32 32 fn collect_pybytes_list(
33 33 py: Python,
34 34 collection: &[impl AsRef<HgPath>],
35 35 ) -> PyList {
36 36 let list = PyList::new(py, &[]);
37 37
38 38 for path in collection.iter() {
39 39 list.append(
40 40 py,
41 41 PyBytes::new(py, path.as_ref().as_bytes()).into_object(),
42 42 )
43 43 }
44 44
45 45 list
46 46 }
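
Until then, the same append loop can also be written as a collect-then-construct; this is only a sketch of the equivalent shape (rust-cpython's `PyList::new` takes a slice of `PyObject`s):

    let objects: Vec<PyObject> = collection
        .iter()
        .map(|p| PyBytes::new(py, p.as_ref().as_bytes()).into_object())
        .collect();
    let list = PyList::new(py, &objects);
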
47 47
48 48 fn collect_bad_matches(
49 49 py: Python,
50 50 collection: &[(impl AsRef<HgPath>, BadMatch)],
51 51 ) -> PyResult<PyList> {
52 52 let list = PyList::new(py, &[]);
53 53
54 54 let os = py.import("os")?;
55 55 let get_error_message = |code: i32| -> PyResult<_> {
56 56 os.call(
57 57 py,
58 58 "strerror",
59 59 PyTuple::new(py, &[code.to_py_object(py).into_object()]),
60 60 None,
61 61 )
62 62 };
63 63
64 64 for (path, bad_match) in collection.iter() {
65 65 let message = match bad_match {
66 66 BadMatch::OsError(code) => get_error_message(*code)?,
67 67 BadMatch::BadType(bad_type) => format!(
68 68 "unsupported file type (type is {})",
69 69 bad_type.to_string()
70 70 )
71 71 .to_py_object(py)
72 72 .into_object(),
73 73 };
74 74 list.append(
75 75 py,
76 76 (PyBytes::new(py, path.as_ref().as_bytes()), message)
77 77 .to_py_object(py)
78 78 .into_object(),
79 79 )
80 80 }
81 81
82 82 Ok(list)
83 83 }
84 84
85 85 fn handle_fallback(py: Python, err: StatusError) -> PyErr {
86 86 match err {
87 87 StatusError::Pattern(e) => {
88 88 let as_string = e.to_string();
89 89 log::trace!("Rust status fallback: `{}`", &as_string);
90 90
91 91 PyErr::new::<FallbackError, _>(py, &as_string)
92 92 }
93 93 StatusError::IO(e) => PyErr::new::<OSError, _>(py, e.to_string()),
94 94 e => PyErr::new::<ValueError, _>(py, e.to_string()),
95 95 }
96 96 }
97 97
98 98 pub fn status_wrapper(
99 99 py: Python,
100 100 dmap: DirstateMap,
101 101 matcher: PyObject,
102 102 root_dir: PyObject,
103 103 ignore_files: PyList,
104 104 check_exec: bool,
105 105 last_normal_time: i64,
106 106 list_clean: bool,
107 107 list_ignored: bool,
108 108 list_unknown: bool,
109 109 collect_traversed_dirs: bool,
110 110 ) -> PyResult<PyTuple> {
111 111 let bytes = root_dir.extract::<PyBytes>(py)?;
112 112 let root_dir = get_path_from_bytes(bytes.data(py));
113 113
114 114 let dmap: DirstateMap = dmap.to_py_object(py);
115 115 let mut dmap = dmap.get_inner_mut(py);
116 116
117 117 let ignore_files: PyResult<Vec<_>> = ignore_files
118 118 .iter(py)
119 119 .map(|b| {
120 120 let file = b.extract::<PyBytes>(py)?;
121 121 Ok(get_path_from_bytes(file.data(py)).to_owned())
122 122 })
123 123 .collect();
124 124 let ignore_files = ignore_files?;
125 125
126 126 match matcher.get_type(py).name(py).borrow() {
127 127 "alwaysmatcher" => {
128 128 let matcher = AlwaysMatcher;
129 129 let (status_res, warnings) = dmap
130 130 .status(
131 131 &matcher,
132 132 root_dir.to_path_buf(),
133 133 ignore_files,
134 134 StatusOptions {
135 135 check_exec,
136 136 last_normal_time,
137 137 list_clean,
138 138 list_ignored,
139 139 list_unknown,
140 140 collect_traversed_dirs,
141 141 },
142 142 )
143 143 .map_err(|e| handle_fallback(py, e))?;
144 144 build_response(py, status_res, warnings)
145 145 }
146 146 "exactmatcher" => {
147 147 let files = matcher.call_method(
148 148 py,
149 149 "files",
150 150 PyTuple::new(py, &[]),
151 151 None,
152 152 )?;
153 153 let files: PyList = files.cast_into(py)?;
154 154 let files: PyResult<Vec<HgPathBuf>> = files
155 155 .iter(py)
156 156 .map(|f| {
157 157 Ok(HgPathBuf::from_bytes(
158 158 f.extract::<PyBytes>(py)?.data(py),
159 159 ))
160 160 })
161 161 .collect();
162 162
163 163 let files = files?;
164 164 let matcher = FileMatcher::new(files.as_ref())
165 165 .map_err(|e| PyErr::new::<ValueError, _>(py, e.to_string()))?;
166 166 let (status_res, warnings) = dmap
167 167 .status(
168 168 &matcher,
169 169 root_dir.to_path_buf(),
170 170 ignore_files,
171 171 StatusOptions {
172 172 check_exec,
173 173 last_normal_time,
174 174 list_clean,
175 175 list_ignored,
176 176 list_unknown,
177 177 collect_traversed_dirs,
178 178 },
179 179 )
180 180 .map_err(|e| handle_fallback(py, e))?;
181 181 build_response(py, status_res, warnings)
182 182 }
183 183 "includematcher" => {
184 184 // Get the patterns from Python even though most of them are
185 185 // redundant with those we will parse later on, as they include
186 186 // those passed from the command line.
187 187 let ignore_patterns: PyResult<Vec<_>> = matcher
188 188 .getattr(py, "_kindpats")?
189 189 .iter(py)?
190 190 .map(|k| {
191 191 let k = k?;
192 192 let syntax = parse_pattern_syntax(
193 193 &[
194 194 k.get_item(py, 0)?
195 195 .extract::<PyBytes>(py)?
196 196 .data(py),
197 197 &b":"[..],
198 198 ]
199 199 .concat(),
200 200 )
201 201 .map_err(|e| {
202 202 handle_fallback(py, StatusError::Pattern(e))
203 203 })?;
204 204 let pattern = k.get_item(py, 1)?.extract::<PyBytes>(py)?;
205 205 let pattern = pattern.data(py);
206 206 let source = k.get_item(py, 2)?.extract::<PyBytes>(py)?;
207 207 let source = get_path_from_bytes(source.data(py));
208 208 let new = IgnorePattern::new(syntax, pattern, source);
209 209 Ok(new)
210 210 })
211 211 .collect();
212 212
213 213 let ignore_patterns = ignore_patterns?;
214 214 let mut all_warnings = vec![];
215 215
216 216 let (matcher, warnings) =
217 217 IncludeMatcher::new(ignore_patterns, &root_dir)
218 218 .map_err(|e| handle_fallback(py, e.into()))?;
219 219 all_warnings.extend(warnings);
220 220
221 221 let (status_res, warnings) = dmap
222 222 .status(
223 223 &matcher,
224 224 root_dir.to_path_buf(),
225 225 ignore_files,
226 226 StatusOptions {
227 227 check_exec,
228 228 last_normal_time,
229 229 list_clean,
230 230 list_ignored,
231 231 list_unknown,
232 232 collect_traversed_dirs,
233 233 },
234 234 )
235 235 .map_err(|e| handle_fallback(py, e))?;
236 236
237 237 all_warnings.extend(warnings);
238 238
239 239 build_response(py, status_res, all_warnings)
240 240 }
241 241 e => Err(PyErr::new::<ValueError, _>(
242 242 py,
243 243 format!("Unsupported matcher {}", e),
244 244 )),
245 245 }
246 246 }
247 247
248 248 fn build_response(
249 249 py: Python,
250 250 status_res: DirstateStatus,
251 251 warnings: Vec<PatternFileWarning>,
252 252 ) -> PyResult<PyTuple> {
253 253 let modified = collect_pybytes_list(py, status_res.modified.as_ref());
254 254 let added = collect_pybytes_list(py, status_res.added.as_ref());
255 255 let removed = collect_pybytes_list(py, status_res.removed.as_ref());
256 256 let deleted = collect_pybytes_list(py, status_res.deleted.as_ref());
257 257 let clean = collect_pybytes_list(py, status_res.clean.as_ref());
258 258 let ignored = collect_pybytes_list(py, status_res.ignored.as_ref());
259 259 let unknown = collect_pybytes_list(py, status_res.unknown.as_ref());
260 260 let unsure = collect_pybytes_list(py, status_res.unsure.as_ref());
261 261 let bad = collect_bad_matches(py, status_res.bad.as_ref())?;
262 262 let traversed = collect_pybytes_list(py, status_res.traversed.as_ref());
263 let dirty = status_res.dirty.to_py_object(py);
263 264 let py_warnings = PyList::new(py, &[]);
264 265 for warning in warnings.iter() {
265 266 // We use duck-typing on the Python side for dispatch, good enough for
266 267 // now.
267 268 match warning {
268 269 PatternFileWarning::InvalidSyntax(file, syn) => {
269 270 py_warnings.append(
270 271 py,
271 272 (
272 273 PyBytes::new(py, &get_bytes_from_path(&file)),
273 274 PyBytes::new(py, syn),
274 275 )
275 276 .to_py_object(py)
276 277 .into_object(),
277 278 );
278 279 }
279 280 PatternFileWarning::NoSuchFile(file) => py_warnings.append(
280 281 py,
281 282 PyBytes::new(py, &get_bytes_from_path(&file)).into_object(),
282 283 ),
283 284 }
284 285 }
285 286
286 287 Ok(PyTuple::new(
287 288 py,
288 289 &[
289 290 unsure.into_object(),
290 291 modified.into_object(),
291 292 added.into_object(),
292 293 removed.into_object(),
293 294 deleted.into_object(),
294 295 clean.into_object(),
295 296 ignored.into_object(),
296 297 unknown.into_object(),
297 298 py_warnings.into_object(),
298 299 bad.into_object(),
299 300 traversed.into_object(),
301 dirty.into_object(),
300 302 ][..],
301 303 ))
302 304 }