upstream/mercurial-mirror Commit - r16955:92e1c64b

parsers: add a C function to pack the dirstate...

Bryan O'Sullivan -

r16955:92e1c64b default

parent child

mercurial/dirstate.py

0 +15 -6

              # dirstate.py - working directory tracking for mercurial
              #
              # Copyright 2005-2007 Matt Mackall <mpm@selenic.com>
              #
              # This software may be used and distributed according to the terms of the
              # GNU General Public License version 2 or any later version.
              import errno
              from node import nullid
              from i18n import _
              import scmutil, util, ignore, osutil, parsers, encoding
              import struct, os, stat, errno
              import cStringIO
              # struct layout of the fixed-size header packed for each entry in
              # dirstate.write(): big-endian, one state char followed by four 32-bit
              # ints (mode, size, mtime, length of the filename field)
              _format = ">cllll"
              # short aliases for the caching decorators used on dirstate attributes
              propertycache = util.propertycache
              filecache = scmutil.filecache
              class repocache(filecache):
                  """filecache variant for files living in .hg/

                  File names are resolved through the owning object's opener.
                  """
                  def join(self, obj, fname):
                      opener = obj._opener
                      return opener.join(fname)
              class rootcache(filecache):
                  """filecache variant for files living in the repository root

                  File names are resolved through the owning object's _join().
                  """
                  def join(self, obj, fname):
                      resolve = obj._join
                      return resolve(fname)
              def _finddirs(path):
                  pos = path.rfind('/')
                  while pos != -1:
                      yield path[:pos]
                      pos = path.rfind('/', 0, pos)
              def _incdirs(dirs, path):
                  '''Count path in the per-directory reference counts held in dirs.

                  Walks the ancestors of path from the deepest up.  Directories not
                  yet in dirs are added with a count of 1; the first directory that
                  is already present gets its count bumped and ends the walk.
                  '''
                  for parent in _finddirs(path):
                      known = parent in dirs
                      dirs[parent] = dirs.get(parent, 0) + 1
                      if known:
                          break
              def _decdirs(dirs, path):
                  '''Undo one _incdirs() of path on the reference counts in dirs.

                  Walks the ancestors of path from the deepest up.  Directories
                  whose count is not above 1 are removed; the first directory with
                  a larger count is decremented and ends the walk.  A directory
                  missing from dirs raises KeyError.
                  '''
                  for parent in _finddirs(path):
                      remaining = dirs[parent] - 1
                      if remaining < 1:
                          del dirs[parent]
                          continue
                      dirs[parent] = remaining
                      break
              class dirstate(object):
                  def __init__(self, opener, ui, root, validate):
                      '''Set up an empty dirstate object; only attributes are assigned.

                      opener is an open()-like callable that can be used to open the
                      dirstate file; ui supplies configuration and warnings; root is
                      the root of the directory tracked by the dirstate; validate is
                      applied to each parent node handed out by parents(), p1() and
                      p2().
                      '''
                      self._ui = ui
                      self._opener = opener
                      self._validate = validate
                      self._root = root
                      # root with a trailing separator, used as prefix by _join()
                      self._rootdir = os.path.join(root, '')
                      self._dirty = False
                      self._dirtypl = False
                      self._lastnormaltime = 0
                      self._filecache = {}
                  @propertycache
                  def _map(self):
                      '''Return the dirstate contents as a map from filename to
                      (state, mode, size, time).

                      The map is loaded on first access: _read() assigns self._map
                      itself, and that freshly assigned attribute is what is returned.
                      '''
                      self._read()
                      return self._map
                  @propertycache
                  def _copymap(self):
                      '''Return the map from copy destination to copy source.

                      Loaded on first access: _read() assigns self._copymap itself,
                      and that freshly assigned attribute is what is returned.
                      '''
                      self._read()
                      return self._copymap
                  @propertycache
                  def _foldmap(self):
                      '''Return a map from util.normcase(name) to the stored name.

                      Covers every file in the dirstate map and every directory in
                      _dirs; directories win when both normalize to the same key.
                      '''
                      normcase = util.normcase
                      folded = dict([(normcase(name), name) for name in self._map])
                      folded.update([(normcase(name), name) for name in self._dirs])
                      # prevents useless util.fspath() invocation
                      folded['.'] = '.'
                      return folded
                  @repocache('branch')
                  def _branch(self):
                      try:
                          return self._opener.read("branch").strip() or "default"
                      except IOError, inst:
                          if inst.errno != errno.ENOENT:
                              raise
                          return "default"
                  @propertycache
                  def _pl(self):
                      try:
                          fp = self._opener("dirstate")
                          st = fp.read(40)
                          fp.close()
                          l = len(st)
                          if l == 40:
                              return st[:20], st[20:40]
                          elif l > 0 and l < 40:
                              raise util.Abort(_('working directory state appears damaged!'))
                      except IOError, err:
                          if err.errno != errno.ENOENT:
                              raise
                      return [nullid, nullid]
                  @propertycache
                  def _dirs(self):
                      '''Return reference counts for the directories of all entries
                      whose state is not 'r', built with _incdirs().'''
                      counts = {}
                      for fname, entry in self._map.iteritems():
                          if entry[0] == 'r':
                              continue
                          _incdirs(counts, fname)
                      return counts
                  def dirs(self):
                      '''Return the cached directory reference-count map (_dirs).'''
                      counts = self._dirs
                      return counts
                  @rootcache('.hgignore')
                  def _ignore(self):
                      '''Build the ignore matcher via ignore.ignore().

                      The pattern files are the repository's .hgignore followed by
                      the expanded paths of every "ui" config item named "ignore" or
                      starting with "ignore.".
                      '''
                      files = [self._join('.hgignore')]
                      files.extend([util.expandpath(path)
                                    for name, path in self._ui.configitems("ui")
                                    if name == 'ignore' or name.startswith('ignore.')])
                      return ignore.ignore(self._root, files, self._ui.warn)
                  @propertycache
                  def _slash(self):
                      '''Return a true value when ui.slash is set and os.sep is not '/'.

                      A false ui.slash value is handed back unchanged.
                      '''
                      wanted = self._ui.configbool('ui', 'slash')
                      if not wanted:
                          return wanted
                      return os.sep != '/'
                  @propertycache
                  def _checklink(self):
                      '''Return the cached result of util.checklink() for the root.'''
                      root = self._root
                      return util.checklink(root)
                  @propertycache
                  def _checkexec(self):
                      '''Return the cached result of util.checkexec() for the root.'''
                      root = self._root
                      return util.checkexec(root)
                  @propertycache
                  def _checkcase(self):
                      '''Return the negation of util.checkcase() for the .hg directory.

                      normalize() only folds path case when this is true.
                      '''
                      result = util.checkcase(self._join('.hg'))
                      return not result
                  def _join(self, f):
                      '''Return f prefixed with the repository root directory.'''
                      # plain concatenation is much faster than os.path.join(), and
                      # it is safe because f is always a relative path
                      prefix = self._rootdir
                      return prefix + f
                  def flagfunc(self, buildfallback):
                      '''Return a function mapping a filename to its flags.

                      The returned function yields 'l' for a symlink, 'x' for an
                      executable and '' otherwise.  Each flag is read from the
                      working directory when the matching _checklink / _checkexec
                      property is true, and from the function returned by
                      buildfallback() when it is not.  buildfallback() is only called
                      when at least one of the two properties is false.
                      '''
                      if self._checklink and self._checkexec:
                          # both flags can be read straight from disk
                          def fromdisk(path):
                              full = self._join(path)
                              if os.path.islink(full):
                                  return 'l'
                              if util.isexec(full):
                                  return 'x'
                              return ''
                          return fromdisk
                      fallback = buildfallback()
                      if self._checklink:
                          # links from disk, exec bit from the fallback
                          def linkfromdisk(path):
                              if os.path.islink(self._join(path)):
                                  return 'l'
                              if 'x' in fallback(path):
                                  return 'x'
                              return ''
                          return linkfromdisk
                      if not self._checkexec:
                          return fallback
                      # exec bit from disk, links from the fallback
                      def execfromdisk(path):
                          if 'l' in fallback(path):
                              return 'l'
                          if util.isexec(self._join(path)):
                              return 'x'
                          return ''
                      return execfromdisk
                  def getcwd(self):
                      '''Return the current directory relative to the repository root.

                      The result is '' at the root itself, the relative path when
                      inside the repository, and the unchanged absolute path when
                      the current directory lies outside of it.
                      '''
                      here = os.getcwd()
                      root = self._root
                      if here == root:
                          return ''
                      # root already ends with a path separator if it is '/' or 'C:\'
                      prefix = root
                      if not util.endswithsep(prefix):
                          prefix = prefix + os.sep
                      if not here.startswith(prefix):
                          # we're outside the repo. return an absolute path.
                          return here
                      return here[len(prefix):]
                  def pathto(self, f, cwd=None):
                      '''Return util.pathto() for f, computed from cwd.

                      cwd defaults to getcwd().  The result is passed through
                      util.normpath() when the _slash property is true.
                      '''
                      base = cwd
                      if base is None:
                          base = self.getcwd()
                      result = util.pathto(self._root, base, f)
                      if not self._slash:
                          return result
                      return util.normpath(result)
                  def __getitem__(self, key):
                      '''Return the one-letter state of the filename key.

                      States are:
                        n  normal
                        m  needs merging
                        r  marked for removal
                        a  marked for addition
                        ?  not tracked
                      '''
                      try:
                          entry = self._map[key]
                      except KeyError:
                          return "?"
                      return entry[0]
                  def __contains__(self, key):
                      '''Return True when key has an entry in the dirstate map.'''
                      entries = self._map
                      return key in entries
                  def __iter__(self):
                      '''Yield every filename of the dirstate map in sorted order.'''
                      ordered = sorted(self._map)
                      for fname in ordered:
                          yield fname
                  def parents(self):
                      '''Return the list of parent nodes, each passed through
                      the validate callable.'''
                      validate = self._validate
                      nodes = []
                      for node in self._pl:
                          nodes.append(validate(node))
                      return nodes
                  def p1(self):
                      '''Return the validated first parent node.'''
                      validate = self._validate
                      return validate(self._pl[0])
                  def p2(self):
                      '''Return the validated second parent node.'''
                      validate = self._validate
                      return validate(self._pl[1])
                  def branch(self):
                      '''Return the stored branch name converted by encoding.tolocal().'''
                      stored = self._branch
                      return encoding.tolocal(stored)
                  def setparents(self, p1, p2=nullid):
                      """Set dirstate parents to p1 and p2.

                      When moving from two parents to one, 'm' merged entries are
                      adjusted to normal and their previous copy records are
                      discarded and returned by the call as a {dest: source} dict.
                      In every other case the returned dict is empty.

                      See localrepo.setparents()
                      """
                      self._dirty = True
                      self._dirtypl = True
                      wasmerge = self._pl[1] != nullid
                      self._pl = p1, p2
                      discarded = {}
                      if not wasmerge or p2 != nullid:
                          return discarded
                      # Discard 'm' markers when moving away from a merge state
                      for fname, entry in self._map.iteritems():
                          if entry[0] != 'm':
                              continue
                          if fname in self._copymap:
                              discarded[fname] = self._copymap[fname]
                          self.normallookup(fname)
                      return discarded
                  def setbranch(self, branch):
                      '''Record branch as the current branch and write the "branch" file.

                      Raises util.Abort for the reserved names 'tip', '.' and 'null'.
                      The name is stored after encoding.fromlocal() conversion and
                      written, followed by a newline, through an atomictemp file.
                      '''
                      reserved = ('tip', '.', 'null')
                      if branch in reserved:
                          raise util.Abort(_('the name \'%s\' is reserved') % branch)
                      self._branch = encoding.fromlocal(branch)
                      fp = self._opener('branch', 'w', atomictemp=True)
                      try:
                          fp.write(self._branch + '\n')
                      finally:
                          fp.close()
                  def _read(self):
                      self._map = {}
                      self._copymap = {}
                      try:
                          st = self._opener.read("dirstate")
                      except IOError, err:
                          if err.errno != errno.ENOENT:
                              raise
                          return
                      if not st:
                          return
                      p = parsers.parse_dirstate(self._map, self._copymap, st)
                      if not self._dirtypl:
                          self._pl = p
                  def invalidate(self):
                      '''Forget all cached state so it is recomputed on next access.

                      Deletes each cached attribute currently present on the
                      instance, then resets _lastnormaltime and the _dirty flag.
                      '''
                      cached = ("_map", "_copymap", "_foldmap", "_branch", "_pl",
                                "_dirs", "_ignore")
                      for name in cached:
                          if name not in self.__dict__:
                              continue
                          delattr(self, name)
                      self._dirty = False
                      self._lastnormaltime = 0
                  def copy(self, source, dest):
                      """Mark dest as a copy of source. Unmark dest if source is None.

                      Does nothing at all when source and dest are equal; otherwise
                      the dirstate is flagged dirty.
                      """
                      if source == dest:
                          return
                      self._dirty = True
                      if source is None:
                          self._copymap.pop(dest, None)
                      else:
                          self._copymap[dest] = source
                  def copied(self, file):
                      '''Return the recorded copy source of file, or None.'''
                      copymap = self._copymap
                      return copymap.get(file)
                  def copies(self):
                      '''Return the copy map itself (destination -> source), not a copy.'''
                      copymap = self._copymap
                      return copymap
                  def _droppath(self, f):
                      '''Release f's directory reference counts.

                      Nothing happens when f is untracked or removed, or when _dirs
                      has not been computed yet.
                      '''
                      state = self[f]
                      if state in "?r":
                          return
                      if "_dirs" in self.__dict__:
                          _decdirs(self._dirs, f)
                  def _addpath(self, f, check=False):
                      '''Prepare the dirstate for (re)adding f.

                      When check is true or f is currently in state 'r', the name is
                      validated with scmutil.checkfilename() and util.Abort is raised
                      if f is a known directory or if one of its parent directories
                      is a non-removed file in the dirstate.  Afterwards the
                      directory reference counts are bumped when f was untracked or
                      removed and _dirs has already been computed.
                      '''
                      previous = self[f]
                      if check or previous == "r":
                          scmutil.checkfilename(f)
                          dirs = self._dirs
                          if f in dirs:
                              raise util.Abort(_('directory %r already in dirstate') % f)
                          # shadows
                          for parent in _finddirs(f):
                              if parent in dirs:
                                  break
                              if parent not in self._map:
                                  continue
                              if self[parent] != 'r':
                                  raise util.Abort(
                                      _('file %r in dirstate clashes with %r') % (parent, f))
                      hasdirs = "_dirs" in self.__dict__
                      if previous in "?r" and hasdirs:
                          _incdirs(self._dirs, f)
                  def normal(self, f):
                      '''Mark a file normal and clean.

                      The entry records the mode, size and integer mtime from
                      os.lstat() of the file; any copy record for f is dropped.
                      '''
                      self._dirty = True
                      self._addpath(f)
                      st = os.lstat(self._join(f))
                      stamp = int(st.st_mtime)
                      self._map[f] = ('n', st.st_mode, st.st_size, stamp)
                      self._copymap.pop(f, None)
                      # Remember the most recent modification timeslot for status(),
                      # to make sure we won't miss future size-preserving file content
                      # modifications that happen within the same timeslot.
                      self._lastnormaltime = max(self._lastnormaltime, stamp)
                  def normallookup(self, f):
                      '''Mark a file normal, but possibly dirty.

                      During a merge, a removed entry that was backed up as merged
                      (size -1) or as coming from the other parent (size -2) is
                      restored to that state together with its copy source, and
                      entries already in one of those two states are left untouched.
                      '''
                      if self._pl[1] != nullid and f in self._map:
                          # if there is a merge going on and the file was either
                          # in state 'm' (-1) or coming from other parent (-2) before
                          # being removed, restore that state.
                          entry = self._map[f]
                          state = entry[0]
                          if state == 'r' and entry[2] in (-1, -2):
                              source = self._copymap.get(f)
                              if entry[2] == -1:
                                  self.merge(f)
                              else:
                                  self.otherparent(f)
                              if source:
                                  self.copy(source, f)
                              return
                          if state == 'm' or (state == 'n' and entry[2] == -2):
                              return
                      self._dirty = True
                      self._addpath(f)
                      self._map[f] = ('n', 0, -1, -1)
                      self._copymap.pop(f, None)
                  def otherparent(self, f):
                      '''Mark as coming from the other parent, always dirty.

                      Raises util.Abort when there is no second parent.  The entry is
                      stored with size -2 and any copy record for f is dropped.
                      '''
                      inmerge = self._pl[1] != nullid
                      if not inmerge:
                          raise util.Abort(_("setting %r to other parent "
                                             "only allowed in merges") % f)
                      self._dirty = True
                      self._addpath(f)
                      self._map[f] = ('n', 0, -2, -1)
                      self._copymap.pop(f, None)
                  def add(self, f):
                      '''Mark a file added.

                      The name is always checked by _addpath(); any copy record for
                      f is dropped.
                      '''
                      self._dirty = True
                      self._addpath(f, check=True)
                      self._map[f] = ('a', 0, -1, -1)
                      self._copymap.pop(f, None)
                  def remove(self, f):
                      '''Mark a file removed.

                      During a merge the previous state is backed up in the size
                      field: -1 for a merged entry, -2 for one coming from the other
                      parent.  The copy record is only dropped when nothing was
                      backed up.
                      '''
                      self._dirty = True
                      self._droppath(f)
                      backup = 0
                      inmerge = self._pl[1] != nullid
                      if inmerge and f in self._map:
                          # backup the previous state
                          old = self._map[f]
                          if old[0] == 'm': # merge
                              backup = -1
                          elif old[0] == 'n' and old[2] == -2: # other parent
                              backup = -2
                      self._map[f] = ('r', 0, backup, 0)
                      if backup == 0:
                          self._copymap.pop(f, None)
                  def merge(self, f):
                      '''Mark a file merged.

                      Without a second parent this is the same as normallookup(f).
                      Otherwise the entry records the mode, size and integer mtime
                      from os.lstat() of the file and drops any copy record.
                      '''
                      if self._pl[1] == nullid:
                          return self.normallookup(f)
                      self._dirty = True
                      st = os.lstat(self._join(f))
                      self._addpath(f)
                      self._map[f] = ('m', st.st_mode, st.st_size, int(st.st_mtime))
                      self._copymap.pop(f, None)
                  def drop(self, f):
                      '''Drop a file from the dirstate; unknown files are ignored.'''
                      if f not in self._map:
                          return
                      self._dirty = True
                      self._droppath(f)
                      del self._map[f]
                  def _normalize(self, path, isknown, ignoremissing=False, exists=None):
                      '''Return path with its case folded to the known spelling.

                      A hit in _foldmap wins.  Otherwise a path flagged isknown is
                      returned unchanged.  exists tells whether path is present on
                      disk; None means "check with os.path.lexists()".  For a missing
                      path only the leading directory is normalized, and only when
                      ignoremissing is false.  For an existing path the spelling is
                      taken from util.fspath() and remembered in _foldmap.
                      '''
                      normed = util.normcase(path)
                      folded = self._foldmap.get(normed, None)
                      if folded is not None:
                          return folded
                      if isknown:
                          return path
                      if exists is None:
                          exists = os.path.lexists(os.path.join(self._root, path))
                      if not exists:
                          if ignoremissing or '/' not in path:
                              # No path components, preserve original case
                              return path
                          # Maybe a path component exists
                          d, f = path.rsplit('/', 1)
                          d = self._normalize(d, isknown, ignoremissing, None)
                          return d + "/" + f
                      if '/' in normed:
                          # recursively normalize leading directory components
                          # against dirstate
                          d, f = normed.rsplit('/', 1)
                          d = self._normalize(d, isknown, ignoremissing, True)
                          r = self._root + "/" + d
                          folded = d + "/" + util.fspath(f, r)
                      else:
                          folded = util.fspath(normed, self._root)
                      self._foldmap[normed] = folded
                      return folded
                  def normalize(self, path, isknown=False, ignoremissing=False):
                      '''
                      Normalize the case of a pathname when on a casefolding
                      filesystem; path is returned unchanged when _checkcase is false.

                      isknown specifies whether the filename came from walking the
                      disk, to avoid extra filesystem access.

                      If ignoremissing is True, missing paths are returned
                      unchanged. Otherwise, we try harder to normalize possibly
                      existing path components.

                      The normalized case is determined based on the following
                      precedence:
                      - version of name already stored in the dirstate
                      - version of name stored on disk
                      - version provided via command arguments
                      '''
                      if not self._checkcase:
                          return path
                      return self._normalize(path, isknown, ignoremissing)
                  def clear(self):
                      '''Empty the dirstate in memory and flag it dirty.

                      Resets both maps, the parents and _lastnormaltime, and drops a
                      cached _dirs so it is rebuilt on next access.
                      '''
                      self._map = {}
                      if "_dirs" in self.__dict__:
                          delattr(self, "_dirs")
                      self._copymap = {}
                      self._pl = [nullid, nullid]
                      self._dirty = True
                      self._lastnormaltime = 0
                  def rebuild(self, parent, files):
                      self.clear()
                      for f in files:
                          if 'x' in files.flags(f):
                              self._map[f] = ('n', 0777, -1, 0)
                          else:
                              self._map[f] = ('n', 0666, -1, 0)
                      self._pl = (parent, nullid)
                      self._dirty = True
                  def write(self):
                      '''Write the dirstate to the "dirstate" file if it is dirty.

                      The file is opened with atomictemp=True.  Once the data has
                      been written and the file closed, _lastnormaltime is reset to 0
                      and both _dirty and _dirtypl are cleared.

                      NOTE(review): this block is shown as a diff.  The "+" lines try
                      parsers.pack_dirstate() first and fall back to the Python
                      packing loop on AttributeError; the "-" lines are the code
                      being replaced.
                      '''
                      if not self._dirty:
                          return
                      st = self._opener("dirstate", "w", atomictemp=True)
+                     def finish(s):
+                         st.write(s)
+                         st.close()
+                         self._lastnormaltime = 0
+                         self._dirty = self._dirtypl = False
                      # use the modification time of the newly created temporary file as the
                      # filesystem's notion of 'now'
-                     now = int(util.fstat(st).st_mtime)
+                     now = util.fstat(st).st_mtime
+                     copymap = self._copymap
+                     try:
+                         finish(parsers.pack_dirstate(self._map, copymap, self._pl, now))
+                         return
+                     except AttributeError:
+                         pass
+                     now = int(now)
                      cs = cStringIO.StringIO()
-                     copymap = self._copymap
                      pack = struct.pack
                      write = cs.write
                      write("".join(self._pl))
                      for f, e in self._map.iteritems():
                          if e[0] == 'n' and e[3] == now:
                              # The file was last modified "simultaneously" with the current
                              # write to dirstate (i.e. within the same second for file-
                              # systems with a granularity of 1 sec). This commonly happens
                              # for at least a couple of files on 'update'.
                              # The user could change the file without changing its size
                              # within the same second. Invalidate the file's stat data in
                              # dirstate, forcing future 'status' calls to compare the
                              # contents of the file. This prevents mistakenly treating such
                              # files as clean.
                              e = (e[0], 0, -1, -1)   # mark entry as 'unset'
                              self._map[f] = e
                          if f in copymap:
                              f = "%s\0%s" % (f, copymap[f])
                          e = pack(_format, e[0], e[1], e[2], e[3], len(f))
                          write(e)
                          write(f)
-                     st.write(cs.getvalue())
-                     st.close()
-                     self._lastnormaltime = 0
-                     self._dirty = self._dirtypl = False
+                     finish(cs.getvalue())
                  def _dirignore(self, f):
                      '''Return True when f or one of its parent directories is ignored.

                      The repository root ('.') is never ignored.
                      '''
                      if f == '.':
                          return False
                      candidates = [f]
                      candidates.extend(_finddirs(f))
                      for path in candidates:
                          if self._ignore(path):
                              return True
                      return False
                  def walk(self, match, subrepos, unknown, ignored):
                      '''
                      Walk recursively through the directory tree, finding all files
                      matched by match.

                      match supplies matchfn, bad, files(), anypats(), exact and
                      dir(); subrepos is a list of subrepo paths, which is sorted in
                      place and whose contents are excluded from the walk; unknown
                      and ignored select which ignore functions are used while
                      scanning directories.

                      Return a dict mapping filename to stat-like object (either
                      mercurial.osutil.stat instance or return value of os.lstat()),
                      or to None for an entry that is in the dirstate but is not a
                      regular file or symlink on disk.
                      '''
                      # report a problem with f on the ui; always returns False
                      def fwarn(f, msg):
                          self._ui.warn('%s: %s\n' % (self.pathto(f), msg))
                          return False
                      # build the "unsupported file type" message for a file kind
                      def badtype(mode):
                          kind = _('unknown')
                          if stat.S_ISCHR(mode):
                              kind = _('character device')
                          elif stat.S_ISBLK(mode):
                              kind = _('block device')
                          elif stat.S_ISFIFO(mode):
                              kind = _('fifo')
                          elif stat.S_ISSOCK(mode):
                              kind = _('socket')
                          elif stat.S_ISDIR(mode):
                              kind = _('directory')
                          return _('unsupported file type (type is %s)') % kind
                      # pick the ignore predicates; presumably util.never always
                      # answers False and util.always always answers True
                      ignore = self._ignore
                      dirignore = self._dirignore
                      if ignored:
                          ignore = util.never
                          dirignore = util.never
                      elif not unknown:
                          # if unknown and ignored are False, skip step 2
                          ignore = util.always
                          dirignore = util.always
                      # local aliases for names used in the loops below
                      matchfn = match.matchfn
                      badfn = match.bad
                      dmap = self._map
                      normpath = util.normpath
                      listdir = osutil.listdir
                      lstat = os.lstat
                      getkind = stat.S_IFMT
                      dirkind = stat.S_IFDIR
                      regkind = stat.S_IFREG
                      lnkkind = stat.S_IFLNK
                      join = self._join
                      # stack of directories still to be listed in step 2
                      work = []
                      wadd = work.append
                      exact = skipstep3 = False
                      if matchfn == match.exact: # match.exact
                          exact = True
                          dirignore = util.always # skip step 2
                      elif match.files() and not match.anypats(): # match.match, no patterns
                          skipstep3 = True
                      if not exact and self._checkcase:
                          normalize = self._normalize
                          skipstep3 = False
                      else:
                          normalize = lambda x, y, z: x
                      # drop explicitly listed files that live inside a subrepo; both
                      # lists are sorted so they can be scanned in a single pass
                      files = sorted(match.files())
                      subrepos.sort()
                      i, j = 0, 0
                      while i < len(files) and j < len(subrepos):
                          subpath = subrepos[j] + "/"
                          if files[i] < subpath:
                              i += 1
                              continue
                          while i < len(files) and files[i].startswith(subpath):
                              del files[i]
                          j += 1
                      if not files or '.' in files:
                          files = ['']
                      # pre-seed results with the subrepos and '.hg' so the walk skips
                      # them; these placeholders are removed again before returning
                      results = dict.fromkeys(subrepos)
                      results['.hg'] = None
                      # step 1: find all explicit files
                      for ff in files:
                          nf = normalize(normpath(ff), False, True)
                          if nf in results:
                              continue
                          try:
                              st = lstat(join(nf))
                              kind = getkind(st.st_mode)
                              if kind == dirkind:
                                  skipstep3 = False
                                  if nf in dmap:
                                      #file deleted on disk but still in dirstate
                                      results[nf] = None
                                  match.dir(nf)
                                  if not dirignore(nf):
                                      wadd(nf)
                              elif kind == regkind or kind == lnkkind:
                                  results[nf] = st
                              else:
                                  badfn(ff, badtype(kind))
                                  if nf in dmap:
                                      results[nf] = None
                          except OSError, inst:
                              # lstat failed: the name may still be tracked as a file
                              # or be a directory prefix of tracked files
                              if nf in dmap: # does it exactly match a file?
                                  results[nf] = None
                              else: # does it match a directory?
                                  prefix = nf + "/"
                                  for fn in dmap:
                                      if fn.startswith(prefix):
                                          match.dir(nf)
                                          skipstep3 = False
                                          break
                                  else:
                                      badfn(ff, inst.strerror)
                      # step 2: visit subdirectories
                      while work:
                          nd = work.pop()
                          skip = None
                          if nd == '.':
                              nd = ''
                          else:
                              skip = '.hg'
                          try:
                              entries = listdir(join(nd), stat=True, skip=skip)
                          except OSError, inst:
                              # an unreadable directory is reported and skipped; any
                              # other error is propagated
                              if inst.errno == errno.EACCES:
                                  fwarn(nd, inst.strerror)
                                  continue
                              raise
                          for f, kind, st in entries:
                              nf = normalize(nd and (nd + "/" + f) or f, True, True)
                              if nf not in results:
                                  if kind == dirkind:
                                      if not ignore(nf):
                                          match.dir(nf)
                                          wadd(nf)
                                      if nf in dmap and matchfn(nf):
                                          results[nf] = None
                                  elif kind == regkind or kind == lnkkind:
                                      if nf in dmap:
                                          if matchfn(nf):
                                              results[nf] = st
                                      elif matchfn(nf) and not ignore(nf):
                                          results[nf] = st
                                  elif nf in dmap and matchfn(nf):
                                      results[nf] = None
                      # step 3: report unseen items in the dmap hash
                      if not skipstep3 and not exact:
                          visit = sorted([f for f in dmap if f not in results and matchfn(f)])
                          for nf, st in zip(visit, util.statfiles([join(i) for i in visit])):
                              # anything that is not a regular file or symlink is
                              # recorded without stat data
                              if (not st is None and
                                  getkind(st.st_mode) not in (regkind, lnkkind)):
                                  st = None
                              results[nf] = st
                      # remove the placeholders seeded before step 1
                      for s in subrepos:
                          del results[s]
                      del results['.hg']
                      return results
                  def status(self, match, subrepos, ignored, clean, unknown):
                      '''Determine the status of the working copy relative to the
                      dirstate and return a tuple of lists (unsure, modified, added,
                      removed, deleted, unknown, ignored, clean), where:
                        unsure:
                          files that might have been modified since the dirstate was
                          written, but need to be read to be sure (size is the same
                          but mtime differs)
                        modified:
                          files that have definitely been modified since the dirstate
                          was written (different size or mode)
                        added:
                          files that have been explicitly added with hg add
                        removed:
                          files that have been explicitly removed with hg remove
                        deleted:
                          files that have been deleted through other means ("missing")
                        unknown:
                          files not in the dirstate that are not ignored
                        ignored:
                          files not in the dirstate that are ignored
                          (by _dirignore())
                        clean:
                          files that have definitely not been modified since the
                          dirstate was written

                      match and subrepos are handed to walk() unchanged.  The
                      ignored, clean and unknown arguments are flags: the list of
                      the same name is only filled in when its flag is true, and
                      is returned empty otherwise.
                      '''
                      # Save the flags under new names; the parameter names are
                      # rebound to the result lists on the next two lines.
                      listignored, listclean, listunknown = ignored, clean, unknown
                      lookup, modified, added, unknown, ignored = [], [], [], [], []
                      removed, deleted, clean = [], [], []
                      dmap = self._map
                      # Bound append methods, looked up once for use in the loop.
                      ladd = lookup.append            # aka "unsure"
                      madd = modified.append
                      aadd = added.append
                      uadd = unknown.append
                      iadd = ignored.append
                      radd = removed.append
                      dadd = deleted.append
                      cadd = clean.append
                      lnkkind = stat.S_IFLNK
                      for fn, st in self.walk(match, subrepos, listunknown,
                                              listignored).iteritems():
                          # Untracked file: report it as ignored or unknown, but
                          # only in the lists the caller asked for.
                          if fn not in dmap:
                              if (listignored or match.exact(fn)) and self._dirignore(fn):
                                  if listignored:
                                      iadd(fn)
                              elif listunknown:
                                  uadd(fn)
                              continue
                          # Tracked file: unpack the entry stored in the dirstate map.
                          state, mode, size, time = dmap[fn]
                          # walk() supplied no stat data for a file whose state says
                          # it should be present.
                          if not st and state in "nma":
                              dadd(fn)
                          elif state == 'n':
                              # The "mode & lnkkind != lnkkind or self._checklink"
                              # lines are an expansion of "islink => checklink"
                              # where islink means "is this a link?" and checklink
                              # means "can we check links?".
                              mtime = int(st.st_mtime)
                              # "and" binds tighter than "or": the first three
                              # lines form one clause, and either of the last two
                              # conditions marks the file modified on its own.
                              if (size >= 0 and
                                  (size != st.st_size
                                   or ((mode ^ st.st_mode) & 0100 and self._checkexec))
                                  and (mode & lnkkind != lnkkind or self._checklink)
                                  or size == -2 # other parent
                                  or fn in self._copymap):
                                  madd(fn)
                              elif (mtime != time
                                    and (mode & lnkkind != lnkkind or self._checklink)):
                                  ladd(fn)
                              elif mtime == self._lastnormaltime:
                                  # fn may have been changed in the same timeslot without
                                  # changing its size. This can happen if we quickly do
                                  # multiple commits in a single transaction.
                                  # Force lookup, so we don't miss such a racy file change.
                                  ladd(fn)
                              elif listclean:
                                  cadd(fn)
                          elif state == 'm':
                              madd(fn)
                          elif state == 'a':
                              aadd(fn)
                          elif state == 'r':
                              radd(fn)
                      return (lookup, modified, added, removed, deleted, unknown, ignored,
                              clean)

mercurial/parsers.c

0 +151 0

              /*
               parsers.c - efficient content parsing
               Copyright 2008 Matt Mackall <mpm@selenic.com> and others
               This software may be used and distributed according to the terms of
               the GNU General Public License, incorporated herein by reference.
              */
              #include <Python.h>
              #include <ctype.h>
              #include <string.h>
              #include "util.h"
              /*
               * Decode the hex digit stored at p[off] into its value (0-15).
               *
               * Any other character sets ValueError and yields 0, so a caller that
               * must tell a real '0' from a failure has to consult PyErr_Occurred().
               */
              static inline int hexdigit(const char *p, Py_ssize_t off)
              {
              	const char digit = p[off];
              	switch (digit) {
              	case '0': case '1': case '2': case '3': case '4':
              	case '5': case '6': case '7': case '8': case '9':
              		return digit - '0';
              	case 'a': case 'b': case 'c': case 'd': case 'e': case 'f':
              		return digit - 'a' + 10;
              	case 'A': case 'B': case 'C': case 'D': case 'E': case 'F':
              		return digit - 'A' + 10;
              	default:
              		break;
              	}
              	PyErr_SetString(PyExc_ValueError, "input contains non-hex character");
              	return 0;
              }
              /*
               * Turn a hex-encoded string into binary.
               */
              static PyObject *unhexlify(const char *str, int len)
              {
              	PyObject *ret;
              	char *d;
              	int i;
              	ret = PyBytes_FromStringAndSize(NULL, len / 2);
              	if (!ret)
              		return NULL;
              	d = PyBytes_AsString(ret);
              	for (i = 0; i < len;) {
              		int hi = hexdigit(str, i++);
              		int lo = hexdigit(str, i++);
              		*d++ = (hi << 4) | lo;
              	}
              	return ret;
              }
              /*
               * This code assumes that a manifest is stitched together with newline
               * ('\n') characters.
               *
               * Python arguments: (mfdict, fdict, data).  Each newline-terminated
               * entry of data is split at a NUL byte into a file name and the text
               * after it.  Up to 40 characters of that text are hex-decoded and
               * stored as mfdict[file]; any characters beyond the first 40 are stored
               * as fdict[file].
               *
               * Returns None, or NULL with an exception set.
               */
              static PyObject *parse_manifest(PyObject *self, PyObject *args)
              {
              	PyObject *mfdict, *fdict;
              	char *str, *cur, *start, *zero;
              	int len;
              	if (!PyArg_ParseTuple(args, "O!O!s#:parse_manifest",
              			      &PyDict_Type, &mfdict,
              			      &PyDict_Type, &fdict,
              			      &str, &len))
              		goto quit;
              	/* start: first byte of the current entry; zero: last NUL seen
              	 * in it; cur: scan position. */
              	for (start = cur = str, zero = NULL; cur < str + len; cur++) {
              		PyObject *file = NULL, *node = NULL;
              		PyObject *flags = NULL;
              		int nlen;
              		if (!*cur) {
              			zero = cur;
              			continue;
              		}
              		else if (*cur != '\n')
              			continue;
              		/* cur is at the newline ending the current entry */
              		if (!zero) {
              			PyErr_SetString(PyExc_ValueError,
              					"manifest entry has no separator");
              			goto quit;
              		}
              		file = PyBytes_FromStringAndSize(start, zero - start);
              		if (!file)
              			goto bail;
              		/* number of bytes between the NUL and the newline */
              		nlen = cur - zero - 1;
              		node = unhexlify(zero + 1, nlen > 40 ? 40 : nlen);
              		if (!node)
              			goto bail;
              		if (nlen > 40) {
              			flags = PyBytes_FromStringAndSize(zero + 41,
              							   nlen - 40);
              			if (!flags)
              				goto bail;
              			if (PyDict_SetItem(fdict, file, flags) == -1)
              				goto bail;
              		}
              		if (PyDict_SetItem(mfdict, file, node) == -1)
              			goto bail;
              		/* entry stored: reset for the next one and drop our own
              		 * references (the dicts took theirs) */
              		start = cur + 1;
              		zero = NULL;
              		Py_XDECREF(flags);
              		Py_XDECREF(node);
              		Py_XDECREF(file);
              		continue;
              	bail:
              		/* error inside the loop: release this entry's objects */
              		Py_XDECREF(flags);
              		Py_XDECREF(node);
              		Py_XDECREF(file);
              		goto quit;
              	}
              	/* the final entry must be newline-terminated as well */
              	if (len > 0 && *(cur - 1) != '\n') {
              		PyErr_SetString(PyExc_ValueError,
              				"manifest contains trailing garbage");
              		goto quit;
              	}
              	Py_INCREF(Py_None);
              	return Py_None;
              quit:
              	return NULL;
              }
              /*
               * Parse a serialized dirstate.
               *
               * Python arguments: (dmap, cmap, data).  The first 40 bytes of data are
               * the two 20-byte parent hashes.  Each record after that is a 17-byte
               * header (1-byte state, then mode, size, mtime and name-field length,
               * each read with getbe32) followed by the name field.  Every record
               * stores dmap[name] = (state, mode, size, mtime); when the name field
               * contains a NUL, the bytes after it are stored as cmap[name].
               *
               * Returns the parents as a 2-tuple of strings, or NULL with an
               * exception set.
               */
              static PyObject *parse_dirstate(PyObject *self, PyObject *args)
              {
              	PyObject *dmap, *cmap, *parents = NULL, *ret = NULL;
              	PyObject *fname = NULL, *cname = NULL, *entry = NULL;
              	char *str, *cur, *end, *cpos;
              	int state, mode, size, mtime;
              	unsigned int flen;
              	int len;
              	if (!PyArg_ParseTuple(args, "O!O!s#:parse_dirstate",
              			      &PyDict_Type, &dmap,
              			      &PyDict_Type, &cmap,
              			      &str, &len))
              		goto quit;
              	/* read parents */
              	if (len < 40) {
              		/* returning NULL without an exception set would surface
              		 * as an unrelated SystemError in the caller */
              		PyErr_SetString(PyExc_ValueError,
              				"too little data for parents");
              		goto quit;
              	}
              	parents = Py_BuildValue("s#s#", str, 20, str + 20, 20);
              	if (!parents)
              		goto quit;
              	/* read filenames */
              	cur = str + 40;
              	end = str + len;
              	/* stop once 17 or fewer bytes remain */
              	while (cur < end - 17) {
              		/* unpack header */
              		state = *cur;
              		mode = getbe32(cur + 1);
              		size = getbe32(cur + 5);
              		mtime = getbe32(cur + 9);
              		flen = getbe32(cur + 13);
              		cur += 17;
              		/* cur < end holds here, so end - cur is positive.
              		 * Comparing lengths avoids forming cur + flen, which
              		 * may lie outside the buffer. */
              		if (flen > (size_t)(end - cur)) {
              			PyErr_SetString(PyExc_ValueError, "overflow in dirstate");
              			goto quit;
              		}
              		entry = Py_BuildValue("ciii", state, mode, size, mtime);
              		if (!entry)
              			goto quit;
              		PyObject_GC_UnTrack(entry); /* don't waste time with this */
              		/* a NUL inside the name field separates name and copy source */
              		cpos = memchr(cur, 0, flen);
              		if (cpos) {
              			fname = PyBytes_FromStringAndSize(cur, cpos - cur);
              			cname = PyBytes_FromStringAndSize(cpos + 1,
              							   flen - (cpos - cur) - 1);
              			if (!fname || !cname ||
              			    PyDict_SetItem(cmap, fname, cname) == -1 ||
              			    PyDict_SetItem(dmap, fname, entry) == -1)
              				goto quit;
              			Py_DECREF(cname);
              		} else {
              			fname = PyBytes_FromStringAndSize(cur, flen);
              			if (!fname ||
              			    PyDict_SetItem(dmap, fname, entry) == -1)
              				goto quit;
              		}
              		cur += flen;
              		Py_DECREF(fname);
              		Py_DECREF(entry);
              		/* reset so the cleanup at quit cannot release them twice */
              		fname = cname = entry = NULL;
              	}
              	ret = parents;
              	Py_INCREF(ret);
              quit:
              	Py_XDECREF(fname);
              	Py_XDECREF(cname);
              	Py_XDECREF(entry);
              	Py_XDECREF(parents);
              	return ret;
              }
+             /*
+              * Fetch element off of tuple as a 32-bit value.
+              *
+              * The element must be a Python int or long whose value fits in a C
+              * int; it is stored through v converted to uint32_t.  Returns 0 on
+              * success, -1 with an exception set otherwise.
+              */
+             static inline int getintat(PyObject *tuple, int off, uint32_t *v)
+             {
+             	PyObject *item = PyTuple_GET_ITEM(tuple, off);
+             	long num;
+             	if (!PyInt_Check(item) && !PyLong_Check(item)) {
+             		PyErr_SetString(PyExc_TypeError, "expected an int or long");
+             		return -1;
+             	}
+             	if (PyInt_Check(item)) {
+             		num = PyInt_AS_LONG(item);
+             	} else {
+             		num = PyLong_AsLong(item);
+             		/* -1 is also a legitimate value: ask the error indicator */
+             		if (num == -1 && PyErr_Occurred())
+             			return -1;
+             	}
+             	/* the range test only matters where long is wider than int */
+             	if (LONG_MAX > INT_MAX && (num < INT_MIN || num > INT_MAX)) {
+             		PyErr_SetString(PyExc_OverflowError,
+             				"Python value to large to convert to uint32_t");
+             		return -1;
+             	}
+             	*v = (uint32_t)num;
+             	return 0;
+             }
+             /* Value stored back into the map by pack_dirstate() for entries whose
+              * recorded mtime it drops; not initialised in this part of the file. */
+             static PyObject *dirstate_unset;
+             /*
+              * Efficiently pack a dirstate object into its on-disk format.
+              *
+              * Python arguments: (map, copymap, pl, now).  map and copymap are
+              * dicts keyed by string; every map value must be a 4-tuple
+              * (state, mode, size, mtime) with a one-byte state.  pl is a
+              * 2-element sequence of 20-byte hashes.
+              *
+              * The output is the two hashes followed by one record per map entry:
+              * state byte, then mode, size, mtime and name-field length written
+              * with putbe32, then the name and, if the key is in copymap, a NUL
+              * and the copymap value.
+              *
+              * An entry in state 'n' whose mtime equals now is written with mode 0,
+              * size -1 and mtime -1, and its value in map is replaced by
+              * dirstate_unset.
+              *
+              * Returns the packed string, or NULL with an exception set.
+              */
+             static PyObject *pack_dirstate(PyObject *self, PyObject *args)
+             {
+             	PyObject *packobj = NULL;
+             	PyObject *map, *copymap, *pl;
+             	Py_ssize_t nbytes, pos, l;
+             	PyObject *k, *v, *pn;
+             	char *p, *s;
+             	double now;
+             	int i;
+             	if (!PyArg_ParseTuple(args, "O!O!Od:pack_dirstate",
+             			      &PyDict_Type, &map, &PyDict_Type, &copymap,
+             			      &pl, &now))
+             		return NULL;
+             	if (!PySequence_Check(pl) || PySequence_Size(pl) != 2) {
+             		PyErr_SetString(PyExc_TypeError, "expected 2-element sequence");
+             		return NULL;
+             	}
+             	/* Figure out how much we need to allocate. */
+             	for (nbytes = 40, pos = 0; PyDict_Next(map, &pos, &k, &v);) {
+             		PyObject *c;
+             		if (!PyString_Check(k)) {
+             			PyErr_SetString(PyExc_TypeError, "expected string key");
+             			goto bail;
+             		}
+             		nbytes += PyString_GET_SIZE(k) + 17;
+             		c = PyDict_GetItem(copymap, k);
+             		if (c) {
+             			if (!PyString_Check(c)) {
+             				PyErr_SetString(PyExc_TypeError,
+             						"expected string key");
+             				goto bail;
+             			}
+             			nbytes += PyString_GET_SIZE(c) + 1;
+             		}
+             	}
+             	packobj = PyString_FromStringAndSize(NULL, nbytes);
+             	if (packobj == NULL)
+             		goto bail;
+             	p = PyString_AS_STRING(packobj);
+             	/* The two parent hashes come first. */
+             	for (i = 0; i < 2; i++) {
+             		/* PySequence_ITEM hands back a new reference (or NULL on
+             		 * failure), so it must be checked and released here. */
+             		pn = PySequence_ITEM(pl, i);
+             		if (pn == NULL)
+             			goto bail;
+             		if (PyString_AsStringAndSize(pn, &s, &l) == -1 || l != 20) {
+             			Py_DECREF(pn);
+             			PyErr_SetString(PyExc_TypeError, "expected a 20-byte hash");
+             			goto bail;
+             		}
+             		/* copy before dropping the reference that keeps s alive */
+             		memcpy(p, s, l);
+             		p += 20;
+             		Py_DECREF(pn);
+             	}
+             	for (pos = 0; PyDict_Next(map, &pos, &k, &v); ) {
+             		uint32_t mode, size, mtime;
+             		Py_ssize_t len, l;
+             		PyObject *o;
+             		char *s, *t;
+             		int err;
+             		if (!PyTuple_Check(v) || PyTuple_GET_SIZE(v) != 4) {
+             			PyErr_SetString(PyExc_TypeError, "expected a 4-tuple");
+             			goto bail;
+             		}
+             		o = PyTuple_GET_ITEM(v, 0);
+             		if (PyString_AsStringAndSize(o, &s, &l) == -1 || l != 1) {
+             			PyErr_SetString(PyExc_TypeError, "expected one byte");
+             			goto bail;
+             		}
+             		*p++ = *s;
+             		err = getintat(v, 1, &mode);
+             		err |= getintat(v, 2, &size);
+             		err |= getintat(v, 3, &mtime);
+             		if (err)
+             			goto bail;
+             		if (*s == 'n' && mtime == (uint32_t)now) {
+             			/* See dirstate.py:write for why we do this. */
+             			/* Only the value of an existing key changes, so
+             			 * the PyDict_Next iteration stays valid. */
+             			if (PyDict_SetItem(map, k, dirstate_unset) == -1)
+             				goto bail;
+             			mode = 0, size = -1, mtime = -1;
+             		}
+             		putbe32(mode, p);
+             		putbe32(size, p + 4);
+             		putbe32(mtime, p + 8);
+             		/* t marks the length slot; it is filled in once the
+             		 * total size of the name field is known */
+             		t = p + 12;
+             		p += 16;
+             		len = PyString_GET_SIZE(k);
+             		memcpy(p, PyString_AS_STRING(k), len);
+             		p += len;
+             		o = PyDict_GetItem(copymap, k);
+             		if (o) {
+             			*p++ = '\0';
+             			l = PyString_GET_SIZE(o);
+             			memcpy(p, PyString_AS_STRING(o), l);
+             			p += l;
+             			len += l + 1;
+             		}
+             		putbe32((uint32_t)len, t);
+             	}
+             	/* sanity check: bytes written must match the size computed above */
+             	pos = p - PyString_AS_STRING(packobj);
+             	if (pos != nbytes) {
+             		PyErr_Format(PyExc_SystemError, "bad dirstate size: %ld != %ld",
+                                          (long)pos, (long)nbytes);
+             		goto bail;
+             	}
+             	return packobj;
+             bail:
+             	Py_XDECREF(packobj);
+             	return NULL;
+             }
              /*
               * A base-16 trie for fast node->rev mapping.
               *
               * Each slot of a trie node holds one of:
               *
               * Positive value is index of the next node in the trie
               * Negative value is a leaf: -(rev + 1)
               * Zero is empty
               */
              typedef struct {
              	int children[16]; /* one slot per nybble value (0-15) */
              } nodetree;
              /*
               * This class has two behaviours.
               *
               * When used in a list-like way (with integer keys), we decode an
               * entry in a RevlogNG index file on demand. Our last entry is a
               * sentinel, always a nullid.  We have limited support for
               * integer-keyed insert and delete, only at elements right before the
               * sentinel.
               *
               * With string keys, we lazily perform a reverse mapping from node to
               * rev, using a base-16 trie.
               *
               * The cache, offsets and nt arrays are allocated lazily and stay NULL
               * until first needed.
               */
              typedef struct {
              	PyObject_HEAD
              	/* Type-specific fields go here. */
              	PyObject *data;        /* raw bytes of index */
              	PyObject **cache;      /* cached tuples */
              	const char **offsets;  /* populated on demand */
              	Py_ssize_t raw_length; /* original number of elements */
              	Py_ssize_t length;     /* current number of elements */
              	PyObject *added;       /* populated on demand */
              	PyObject *headrevs;    /* cache, invalidated on changes */
              	nodetree *nt;          /* base-16 trie */
              	int ntlength;          /* # nodes in use */
              	int ntcapacity;        /* # nodes allocated */
              	int ntdepth;           /* maximum depth of tree */
              	int ntsplits;          /* # splits performed */
              	int ntrev;             /* last rev scanned */
              	int ntlookups;         /* # lookups */
              	int ntmisses;          /* # lookups that miss the cache */
              	int inlined;           /* nonzero: locate records via offsets */
              } indexObject;
              static Py_ssize_t index_length(const indexObject *self)
              {
              	if (self->added == NULL)
              		return self->length;
              	return self->length + PyList_GET_SIZE(self->added);
              }
              /* Entry handed out by index_get() for the final (sentinel) position. */
              static PyObject *nullentry;
              /* Zero-initialised 20-byte node id. */
              static const char nullid[20];
              static long inline_scan(indexObject *self, const char **offsets);
              /*
               * Py_BuildValue format for an index entry.  The first field is passed
               * as a uint64_t: where long is 32 bits it needs "K" (unsigned long
               * long), otherwise "k" (unsigned long) is used.
               */
              #if LONG_MAX == 0x7fffffffL
              static char *tuple_format = "Kiiiiiis#";
              #else
              static char *tuple_format = "kiiiiiis#";
              #endif
              /* A RevlogNG v1 index entry is 64 bytes long. */
              static const long v1_hdrsize = 64;
              /*
               * Return a pointer to the beginning of a RevlogNG record.
               *
               * Records sit at a fixed v1_hdrsize stride, except for positions past
               * the first in an inlined index: those are looked up in an offsets
               * table that is built by inline_scan() on first use.  Returns NULL with
               * MemoryError set if that table cannot be allocated.
               */
              static const char *index_deref(indexObject *self, Py_ssize_t pos)
              {
              	if (!self->inlined || pos <= 0)
              		return PyString_AS_STRING(self->data) + pos * v1_hdrsize;
              	if (self->offsets == NULL) {
              		const char **table = malloc(self->raw_length *
              					    sizeof(*table));
              		if (table == NULL)
              			return (const char *)PyErr_NoMemory();
              		self->offsets = table;
              		inline_scan(self, table);
              	}
              	return self->offsets[pos];
              }
              /*
               * RevlogNG format (all in big endian, data may be inlined):
               *    6 bytes: offset
               *    2 bytes: flags
               *    4 bytes: compressed length
               *    4 bytes: uncompressed length
               *    4 bytes: base revision
               *    4 bytes: link revision
               *    4 bytes: parent 1 revision
               *    4 bytes: parent 2 revision
               *   32 bytes: nodeid (only 20 bytes used)
               *
               * Return a new reference to the entry at pos; a negative pos counts
               * from the end.  The last position yields nullentry, positions in the
               * "added" list yield the stored object, and all others are decoded from
               * the raw data and kept in self->cache.
               *
               * Returns NULL with an exception set on failure (IndexError when pos is
               * out of range).
               */
              static PyObject *index_get(indexObject *self, Py_ssize_t pos)
              {
              	uint64_t offset_flags;
              	int comp_len, uncomp_len, base_rev, link_rev, parent_1, parent_2;
              	const char *c_node_id;
              	const char *data;
              	Py_ssize_t length = index_length(self);
              	PyObject *entry;
              	if (pos < 0)
              		pos += length;
              	if (pos < 0 || pos >= length) {
              		PyErr_SetString(PyExc_IndexError, "revlog index out of range");
              		return NULL;
              	}
              	if (pos == length - 1) {
              		Py_INCREF(nullentry);
              		return nullentry;
              	}
              	if (pos >= self->length - 1) {
              		PyObject *obj;
              		obj = PyList_GET_ITEM(self->added, pos - self->length + 1);
              		Py_INCREF(obj);
              		return obj;
              	}
              	if (self->cache) {
              		if (self->cache[pos]) {
              			Py_INCREF(self->cache[pos]);
              			return self->cache[pos];
              		}
              	} else {
              		self->cache = calloc(self->raw_length, sizeof(PyObject *));
              		if (self->cache == NULL)
              			return PyErr_NoMemory();
              	}
              	data = index_deref(self, pos);
              	if (data == NULL)
              		return NULL;
              	offset_flags = getbe32(data + 4);
              	if (pos == 0) /* mask out version number for the first entry */
              		offset_flags &= 0xFFFF;
              	else {
              		uint32_t offset_high = getbe32(data);
              		offset_flags |= ((uint64_t)offset_high) << 32;
              	}
              	comp_len = getbe32(data + 8);
              	uncomp_len = getbe32(data + 12);
              	base_rev = getbe32(data + 16);
              	link_rev = getbe32(data + 20);
              	parent_1 = getbe32(data + 24);
              	parent_2 = getbe32(data + 28);
              	c_node_id = data + 32;
              	entry = Py_BuildValue(tuple_format, offset_flags, comp_len,
              			      uncomp_len, base_rev, link_rev,
              			      parent_1, parent_2, c_node_id, 20);
              	/* Py_BuildValue can fail: only touch entry when it exists.  The
              	 * cache keeps the reference from Py_BuildValue; the extra one
              	 * goes to the caller. */
              	if (entry) {
              		PyObject_GC_UnTrack(entry);
              		Py_INCREF(entry);
              	}
              	self->cache[pos] = entry;
              	return entry;
              }
              /*
               * Return the 20-byte SHA of the node corresponding to the given rev.
               *
               * The last position and INT_MAX both map to nullid.  NULL is returned
               * for a position at or past the end, or when the entry cannot be read.
               */
              static const char *index_node(indexObject *self, Py_ssize_t pos)
              {
              	const Py_ssize_t total = index_length(self);
              	const Py_ssize_t firstadded = self->length - 1;
              	if (pos == INT_MAX || pos == total - 1)
              		return nullid;
              	if (pos >= total)
              		return NULL;
              	if (pos < firstadded) {
              		/* decoded from the raw index data */
              		const char *record = index_deref(self, pos);
              		if (record == NULL)
              			return NULL;
              		return record + 32;
              	} else {
              		/* held in the "added" list; item 7 of the tuple is the node */
              		PyObject *added = PyList_GET_ITEM(self->added,
              						  pos - firstadded);
              		PyObject *node = PyTuple_GetItem(added, 7);
              		if (node == NULL)
              			return NULL;
              		return PyString_AS_STRING(node);
              	}
              }
              static int nt_insert(indexObject *self, const char *node, int rev);
              /*
               * Extract the string data of obj into *node / *nodelen and require it
               * to be exactly 20 bytes long.  Returns 0 on success, -1 with an
               * exception set otherwise.
               */
              static int node_check(PyObject *obj, char **node, Py_ssize_t *nodelen)
              {
              	if (PyString_AsStringAndSize(obj, node, nodelen) == -1)
              		return -1;
              	if (*nodelen != 20) {
              		PyErr_SetString(PyExc_ValueError, "20-byte hash required");
              		return -1;
              	}
              	return 0;
              }
              /*
               * Python arguments: (offset, entry).  Append an 8-tuple entry whose
               * item 7 is a 20-byte node.  The only accepted position is the one
               * right before the final element (a negative offset counts from the
               * end).  The entry goes onto the "added" list, is inserted into the
               * node trie when one exists, and the cached head revs are dropped.
               *
               * Returns None, or NULL with an exception set.
               */
              static PyObject *index_insert(indexObject *self, PyObject *args)
              {
              	PyObject *entry;
              	char *node;
              	long where;
              	Py_ssize_t total, nodelen;
              	if (!PyArg_ParseTuple(args, "lO", &where, &entry))
              		return NULL;
              	if (!PyTuple_Check(entry) || PyTuple_GET_SIZE(entry) != 8) {
              		PyErr_SetString(PyExc_TypeError, "8-tuple required");
              		return NULL;
              	}
              	if (node_check(PyTuple_GET_ITEM(entry, 7), &node, &nodelen) == -1)
              		return NULL;
              	total = index_length(self);
              	if (where < 0)
              		where += total;
              	if (where != total - 1) {
              		PyErr_SetString(PyExc_IndexError,
              				"insert only supported at index -1");
              		return NULL;
              	}
              	if (where > INT_MAX) {
              		PyErr_SetString(PyExc_ValueError,
              				"currently only 2**31 revs supported");
              		return NULL;
              	}
              	/* the list of added entries is created on first insert */
              	if (self->added == NULL) {
              		self->added = PyList_New(0);
              		if (self->added == NULL)
              			return NULL;
              	}
              	if (PyList_Append(self->added, entry) == -1)
              		return NULL;
              	if (self->nt)
              		nt_insert(self, node, (int)where);
              	Py_CLEAR(self->headrevs);
              	Py_INCREF(Py_None);
              	return Py_None;
              }
              /*
               * Release everything the index caches: the decoded tuples, the offsets
               * table, the node trie and the cached head revs.
               */
              static void _index_clearcaches(indexObject *self)
              {
              	if (self->cache != NULL) {
              		Py_ssize_t slot;
              		for (slot = 0; slot < self->raw_length; slot++)
              			Py_CLEAR(self->cache[slot]);
              		free(self->cache);
              		self->cache = NULL;
              	}
              	/* free(NULL) is a no-op, so no guard is needed for these two */
              	free(self->offsets);
              	self->offsets = NULL;
              	free(self->nt);
              	self->nt = NULL;
              	Py_CLEAR(self->headrevs);
              }
              /*
               * Drop all caches and reset the node trie counters to their initial
               * values.  Returns None.
               */
              static PyObject *index_clearcaches(indexObject *self)
              {
              	_index_clearcaches(self);
              	self->ntlength = 0;
              	self->ntcapacity = 0;
              	self->ntdepth = 0;
              	self->ntsplits = 0;
              	self->ntrev = -1;
              	self->ntlookups = 0;
              	self->ntmisses = 0;
              	Py_INCREF(Py_None);
              	return Py_None;
              }
              /*
               * Return a new dict mapping human-readable labels to the index's
               * length and node trie counters, or NULL with an exception set.
               */
              static PyObject *index_stats(indexObject *self)
              {
              	PyObject *obj = PyDict_New();
              	PyObject *t = NULL;
              	if (obj == NULL)
              		return NULL;
              /*
               * PyDict_SetItemString does not steal the value, so the temporary
               * int is checked for NULL and released after each insertion.  The
               * do/while wrapper keeps the macro safe as the body of an if.
               */
              #define istat(__n, __d) \
              	do { \
              		t = PyInt_FromSsize_t(self->__n); \
              		if (!t) \
              			goto bail; \
              		if (PyDict_SetItemString(obj, __d, t) == -1) \
              			goto bail; \
              		Py_CLEAR(t); \
              	} while (0)
              	if (self->added) {
              		Py_ssize_t len = PyList_GET_SIZE(self->added);
              		t = PyInt_FromSsize_t(len);
              		if (!t)
              			goto bail;
              		if (PyDict_SetItemString(obj, "index entries added", t) == -1)
              			goto bail;
              		Py_CLEAR(t);
              	}
              	if (self->raw_length != self->length - 1)
              		istat(raw_length, "revs on disk");
              	istat(length, "revs in memory");
              	istat(ntcapacity, "node trie capacity");
              	istat(ntdepth, "node trie depth");
              	istat(ntlength, "node trie count");
              	istat(ntlookups, "node trie lookups");
              	istat(ntmisses, "node trie misses");
              	istat(ntrev, "node trie last rev scanned");
              	istat(ntsplits, "node trie splits");
              #undef istat
              	return obj;
              bail:
              	Py_XDECREF(obj);
              	Py_XDECREF(t);
              	return NULL;
              }
              /*
               * Return a new list holding the same items as list, so that a caller
               * mutating the result cannot disturb a cached original.  Returns NULL
               * if the new list cannot be allocated.
               */
              static PyObject *list_copy(PyObject *list)
              {
              	const Py_ssize_t count = PyList_GET_SIZE(list);
              	PyObject *dup = PyList_New(count);
              	Py_ssize_t idx;
              	if (dup != NULL) {
              		for (idx = 0; idx < count; idx++) {
              			PyObject *item = PyList_GET_ITEM(list, idx);
              			/* PyList_SET_ITEM takes over this reference */
              			Py_INCREF(item);
              			PyList_SET_ITEM(dup, idx, item);
              		}
              	}
              	return dup;
              }
              /*
               * Return a list of the revs that are not a parent of any other rev.
               * An index with no revs yields [-1].
               *
               * The result is computed once and kept in self->headrevs; callers
               * always receive a copy.  Returns NULL with an exception set on
               * failure, including ValueError when a parent rev lies outside the
               * index.
               */
              static PyObject *index_headrevs(indexObject *self)
              {
              	Py_ssize_t i, len, addlen;
              	char *nothead = NULL;
              	PyObject *heads;
              	if (self->headrevs)
              		return list_copy(self->headrevs);
              	len = index_length(self) - 1;
              	heads = PyList_New(0);
              	if (heads == NULL)
              		goto bail;
              	if (len == 0) {
              		PyObject *nullrev = PyInt_FromLong(-1);
              		if (nullrev == NULL || PyList_Append(heads, nullrev) == -1) {
              			Py_XDECREF(nullrev);
              			goto bail;
              		}
              		/* PyList_Append took its own reference */
              		Py_DECREF(nullrev);
              		goto done;
              	}
              	/* nothead[rev] becomes 1 once rev is seen as somebody's parent */
              	nothead = calloc(len, 1);
              	if (nothead == NULL) {
              		PyErr_NoMemory();
              		goto bail;
              	}
              	for (i = 0; i < self->raw_length; i++) {
              		const char *data = index_deref(self, i);
              		int parent_1, parent_2;
              		if (data == NULL)
              			goto bail;
              		parent_1 = getbe32(data + 24);
              		parent_2 = getbe32(data + 28);
              		/* a parent beyond the index would write outside nothead */
              		if (parent_1 >= len || parent_2 >= len) {
              			PyErr_SetString(PyExc_ValueError,
              					"parent out of range");
              			goto bail;
              		}
              		if (parent_1 >= 0)
              			nothead[parent_1] = 1;
              		if (parent_2 >= 0)
              			nothead[parent_2] = 1;
              	}
              	addlen = self->added ? PyList_GET_SIZE(self->added) : 0;
              	for (i = 0; i < addlen; i++) {
              		PyObject *rev = PyList_GET_ITEM(self->added, i);
              		PyObject *p1 = PyTuple_GET_ITEM(rev, 5);
              		PyObject *p2 = PyTuple_GET_ITEM(rev, 6);
              		long parent_1, parent_2;
              		if (!PyInt_Check(p1) || !PyInt_Check(p2)) {
              			PyErr_SetString(PyExc_TypeError,
              					"revlog parents are invalid");
              			goto bail;
              		}
              		parent_1 = PyInt_AS_LONG(p1);
              		parent_2 = PyInt_AS_LONG(p2);
              		if (parent_1 >= len || parent_2 >= len) {
              			PyErr_SetString(PyExc_ValueError,
              					"parent out of range");
              			goto bail;
              		}
              		if (parent_1 >= 0)
              			nothead[parent_1] = 1;
              		if (parent_2 >= 0)
              			nothead[parent_2] = 1;
              	}
              	for (i = 0; i < len; i++) {
              		PyObject *head;
              		if (nothead[i])
              			continue;
              		head = PyInt_FromLong(i);
              		if (head == NULL || PyList_Append(heads, head) == -1) {
              			Py_XDECREF(head);
              			goto bail;
              		}
              		/* the list holds its own reference now */
              		Py_DECREF(head);
              	}
              done:
              	self->headrevs = heads;
              	free(nothead);
              	return list_copy(self->headrevs);
              bail:
              	Py_XDECREF(heads);
              	free(nothead);
              	return NULL;
              }
              static inline int nt_level(const char *node, Py_ssize_t level)
              {
              	/*
              	 * Return nybble number "level" of a binary node.  Each byte
              	 * holds two nybbles: even levels select the high half of the
              	 * byte, odd levels the low half.
              	 */
              	int byte = node[level >> 1];
              	int nybble = (level & 1) ? byte : (byte >> 4);
              	return nybble & 0xf;
              }
              /*
               * Look up a node, or a node prefix, in the radix tree.
               *
               * "node" holds hex digits when "hex" is non-zero and raw binary bytes
               * otherwise; "nodelen" is its length in bytes.
               *
               * Return values:
               *
               *   -4: match is ambiguous (multiple candidates)
               *   -2: not found
               * rest: valid rev
               *       (-1 is returned for a full 20-byte null id)
               */
              static int nt_find(indexObject *self, const char *node, Py_ssize_t nodelen,
              		   int hex)
              {
              	/* pick the nybble extractor matching the input encoding */
              	int (*getnybble)(const char *, Py_ssize_t) = hex ? hexdigit : nt_level;
              	int level, maxlevel, off;
              	/* the null id is answered without consulting the tree */
              	if (nodelen == 20 && node[0] == '\0' && memcmp(node, nullid, 20) == 0)
              		return -1;
              	/* no tree has been built yet */
              	if (self->nt == NULL)
              		return -2;
              	/* maxlevel is the number of nybbles to compare, capped at 40 */
              	if (hex)
              		maxlevel = nodelen > 40 ? 40 : (int)nodelen;
              	else
              		maxlevel = nodelen > 20 ? 40 : ((int)nodelen * 2);
              	for (level = off = 0; level < maxlevel; level++) {
              		int k = getnybble(node, level);
              		nodetree *n = &self->nt[off];
              		int v = n->children[k];
              		/* a negative slot is a leaf that encodes a rev as -rev - 1 */
              		if (v < 0) {
              			/* NOTE: this "n" shadows the nodetree pointer above */
              			const char *n;
              			Py_ssize_t i;
              			v = -v - 1;
              			n = index_node(self, v);
              			if (n == NULL)
              				return -2;
              			/* verify the remaining nybbles against the stored node */
              			for (i = level; i < maxlevel; i++)
              				if (getnybble(node, i) != nt_level(n, i))
              					return -2;
              			return v;
              		}
              		/* a zero slot is empty: nothing stored under this prefix */
              		if (v == 0)
              			return -2;
              		/* a positive slot is the offset of the next tree node */
              		off = v;
              	}
              	/* multiple matches against an ambiguous prefix */
              	return -4;
              }
              /*
               * Reserve one more node in the radix tree and return its offset.
               *
               * When the array is full its capacity is doubled and the new tail is
               * zero-filled.  Returns -1 with MemoryError set on failure; in that
               * case the existing tree, its length and its capacity are left
               * untouched so the caller can still use (or free) it.
               *
               * The array may move, so callers must not keep pointers into self->nt
               * across this call.
               */
              static int nt_new(indexObject *self)
              {
              	if (self->ntlength == self->ntcapacity) {
              		nodetree *grown;
              		/* refuse to double if the byte count could overflow */
              		if ((size_t)self->ntcapacity >=
              		    INT_MAX / (sizeof(nodetree) * 2)) {
              			PyErr_SetString(PyExc_MemoryError, "out of memory");
              			return -1;
              		}
              		/*
              		 * realloc into a temporary: assigning straight to
              		 * self->nt would leak the old block and lose the tree
              		 * when the allocation fails.
              		 */
              		grown = realloc(self->nt,
              				self->ntcapacity * 2 * sizeof(nodetree));
              		if (grown == NULL) {
              			PyErr_SetString(PyExc_MemoryError, "out of memory");
              			return -1;
              		}
              		self->nt = grown;
              		self->ntcapacity *= 2;
              		/* new slots must read as "empty" (all children zero) */
              		memset(&self->nt[self->ntlength], 0,
              		       sizeof(nodetree) * (self->ntcapacity - self->ntlength));
              	}
              	return self->ntlength++;
              }
              /*
               * Store the mapping node -> rev in the radix tree.
               *
               * Leaves are stored as -rev - 1, so passing rev == -1 writes 0 and
               * thereby empties the slot.  Returns 0 on success and -1 on failure
               * (nt_new() failed, or all 40 levels were walked without finding a
               * place).
               */
              static int nt_insert(indexObject *self, const char *node, int rev)
              {
              	int level = 0;
              	int off = 0;
              	while (level < 40) {
              		int k = nt_level(node, level);
              		nodetree *n;
              		int v;
              		n = &self->nt[off];
              		v = n->children[k];
              		/* empty slot: store the leaf here */
              		if (v == 0) {
              			n->children[k] = -rev - 1;
              			return 0;
              		}
              		/* slot already holds a leaf */
              		if (v < 0) {
              			const char *oldnode = index_node(self, -v - 1);
              			int noff;
              			/* stale leaf or same node: overwrite in place */
              			if (!oldnode || !memcmp(oldnode, node, 20)) {
              				n->children[k] = -rev - 1;
              				return 0;
              			}
              			/* different node: split by adding a new tree node */
              			noff = nt_new(self);
              			if (noff == -1)
              				return -1;
              			/* self->nt may have been changed by realloc */
              			self->nt[off].children[k] = noff;
              			off = noff;
              			n = &self->nt[off];
              			/* push the old leaf one level down, then retry there */
              			n->children[nt_level(oldnode, ++level)] = v;
              			if (level > self->ntdepth)
              				self->ntdepth = level;
              			self->ntsplits += 1;
              		} else {
              			/* interior node: descend */
              			level += 1;
              			off = v;
              		}
              	}
              	return -1;
              }
              /*
               * Allocate the radix tree on first use and seed it with the null id.
               * Does nothing when the tree already exists.  Returns 0 on success,
               * -1 on failure.
               */
              static int nt_init(indexObject *self)
              {
              	if (self->nt != NULL)
              		return 0;

              	/* start with at least 4 nodes, otherwise half the raw length */
              	if (self->raw_length < 4)
              		self->ntcapacity = 4;
              	else
              		self->ntcapacity = self->raw_length / 2;

              	self->nt = calloc(self->ntcapacity, sizeof(nodetree));
              	if (self->nt == NULL) {
              		PyErr_NoMemory();
              		return -1;
              	}

              	self->ntlength = 1;
              	self->ntrev = (int)index_length(self) - 1;
              	self->ntlookups = 1;
              	self->ntmisses = 0;

              	return nt_insert(self, nullid, INT_MAX) == -1 ? -1 : 0;
              }
              /*
               * Map a binary node to its rev, consulting the radix tree first and
               * falling back to a backwards scan of the index on a miss.
               *
               * Return values:
               *
               *   -3: error (exception set)
               *   -2: not found (no exception set)
               * rest: valid rev
               */
              static int index_find_node(indexObject *self,
              			   const char *node, Py_ssize_t nodelen)
              {
              	int rev;
              	self->ntlookups++;
              	/* fast path: already cached in the tree (or the null id) */
              	rev = nt_find(self, node, nodelen, 0);
              	if (rev >= -1)
              		return rev;
              	if (nt_init(self) == -1)
              		return -3;
              	/*
              	 * For the first handful of lookups, we scan the entire index,
              	 * and cache only the matching nodes. This optimizes for cases
              	 * like "hg tip", where only a few nodes are accessed.
              	 *
              	 * After that, we cache every node we visit, using a single
              	 * scan amortized over multiple lookups.  This gives the best
              	 * bulk performance, e.g. for "hg log".
              	 */
              	if (self->ntmisses++ < 4) {
              		/* self->ntrev is left alone here: only the hit is cached */
              		for (rev = self->ntrev - 1; rev >= 0; rev--) {
              			const char *n = index_node(self, rev);
              			if (n == NULL)
              				return -2;
              			if (memcmp(node, n, nodelen > 20 ? 20 : nodelen) == 0) {
              				if (nt_insert(self, n, rev) == -1)
              					return -3;
              				break;
              			}
              		}
              	} else {
              		/* cache everything visited and record progress in ntrev */
              		for (rev = self->ntrev - 1; rev >= 0; rev--) {
              			const char *n = index_node(self, rev);
              			if (n == NULL) {
              				/* rev was not cached; resume from it next time */
              				self->ntrev = rev + 1;
              				return -2;
              			}
              			if (nt_insert(self, n, rev) == -1) {
              				self->ntrev = rev + 1;
              				return -3;
              			}
              			if (memcmp(node, n, nodelen > 20 ? 20 : nodelen) == 0) {
              				break;
              			}
              		}
              		self->ntrev = rev;
              	}
              	/* rev is -1 here when the scan ran off the start of the index */
              	if (rev >= 0)
              		return rev;
              	return -2;
              }
              /*
               * Set a mercurial.error.RevlogError exception (constructed with no
               * arguments) as the current Python error.
               *
               * The exception class is looked up once and cached in a static.
               * Returns the exception instance on success, or NULL with another
               * exception set if the class could not be found or instantiated.
               *
               * NOTE(review): the returned instance is a new reference from
               * PyObject_CallFunction() and PyErr_SetObject() does not steal it,
               * so a caller that ignores the return value drops one reference.
               */
              static PyObject *raise_revlog_error(void)
              {
              	static PyObject *errclass;
              	PyObject *mod = NULL, *errobj;
              	if (errclass == NULL) {
              		PyObject *dict;
              		mod = PyImport_ImportModule("mercurial.error");
              		if (mod == NULL)
              			goto classfail;
              		/* borrowed reference */
              		dict = PyModule_GetDict(mod);
              		if (dict == NULL)
              			goto classfail;
              		/* borrowed reference; no exception is set on a miss */
              		errclass = PyDict_GetItemString(dict, "RevlogError");
              		if (errclass == NULL) {
              			PyErr_SetString(PyExc_SystemError,
              					"could not find RevlogError");
              			goto classfail;
              		}
              		Py_INCREF(errclass);
              		/*
              		 * The class is now held by its own reference, so release
              		 * the module reference instead of leaking it.
              		 */
              		Py_DECREF(mod);
              		mod = NULL;
              	}
              	errobj = PyObject_CallFunction(errclass, NULL);
              	if (errobj == NULL)
              		return NULL;
              	PyErr_SetObject(errclass, errobj);
              	return errobj;
              classfail:
              	Py_XDECREF(mod);
              	return NULL;
              }
              /*
               * Mapping subscript: index[int] yields the entry at that position,
               * index[node] yields the rev of that node.  An unknown node raises
               * RevlogError.
               */
              static PyObject *index_getitem(indexObject *self, PyObject *value)
              {
              	char *bin;
              	Py_ssize_t binlen;
              	int found;

              	if (PyInt_Check(value))
              		return index_get(self, PyInt_AS_LONG(value));

              	if (node_check(value, &bin, &binlen) == -1)
              		return NULL;

              	found = index_find_node(self, bin, binlen);
              	if (found < -1) {
              		/* -2 is "not found"; anything else already set an error */
              		if (found == -2)
              			raise_revlog_error();
              		return NULL;
              	}
              	return PyInt_FromLong(found);
              }
              /*
               * Resolve a hex node prefix.  The radix tree is completed first so
               * that ambiguity can be detected.  Returns -3 on error, -2 when a
               * node cannot be read, otherwise whatever nt_find() reports.
               */
              static int nt_partialmatch(indexObject *self, const char *node,
              			   Py_ssize_t nodelen)
              {
              	int rev;

              	if (nt_init(self) == -1)
              		return -3;

              	if (self->ntrev > 0) {
              		/* ensure that the radix tree is fully populated */
              		rev = self->ntrev - 1;
              		while (rev >= 0) {
              			const char *bin = index_node(self, rev);
              			if (bin == NULL)
              				return -2;
              			if (nt_insert(self, bin, rev) == -1)
              				return -3;
              			rev--;
              		}
              		self->ntrev = rev;
              	}

              	return nt_find(self, node, nodelen, 1);
              }
              /*
               * Python method: partialmatch(hexprefix).
               *
               * Returns the full 20-byte binary node matching the prefix, None when
               * nothing matches or the input is not hex, and raises RevlogError when
               * the prefix is ambiguous.  Prefixes shorter than 4 characters raise
               * ValueError; anything beyond 40 characters is ignored.
               */
              static PyObject *index_partialmatch(indexObject *self, PyObject *args)
              {
              	const char *fullnode;
              	int nodelen;
              	char *node;
              	int rev, i;
              	if (!PyArg_ParseTuple(args, "s#", &node, &nodelen))
              		return NULL;
              	if (nodelen < 4) {
              		PyErr_SetString(PyExc_ValueError, "key too short");
              		return NULL;
              	}
              	if (nodelen > 40)
              		nodelen = 40;
              	/* results are discarded; only the error indicator is checked below */
              	for (i = 0; i < nodelen; i++)
              		hexdigit(node, i);
              	if (PyErr_Occurred()) {
              		/* input contains non-hex characters */
              		PyErr_Clear();
              		Py_RETURN_NONE;
              	}
              	rev = nt_partialmatch(self, node, nodelen);
              	switch (rev) {
              	case -4:
              		/* ambiguous prefix: set RevlogError, then fall through */
              		raise_revlog_error();
              	case -3:
              		return NULL;
              	case -2:
              		Py_RETURN_NONE;
              	case -1:
              		return PyString_FromStringAndSize(nullid, 20);
              	}
              	fullnode = index_node(self, rev);
              	if (fullnode == NULL) {
              		PyErr_Format(PyExc_IndexError,
              			     "could not access rev %d", rev);
              		return NULL;
              	}
              	return PyString_FromStringAndSize(fullnode, 20);
              }
              /*
               * Python method: get(node).  Like index[node], but returns None
               * instead of raising when the node is unknown.
               */
              static PyObject *index_m_get(indexObject *self, PyObject *args)
              {
              	PyObject *key;
              	char *bin;
              	Py_ssize_t binlen;
              	int found;

              	if (!PyArg_ParseTuple(args, "O", &key))
              		return NULL;
              	if (node_check(key, &bin, &binlen) == -1)
              		return NULL;

              	found = index_find_node(self, bin, binlen);
              	switch (found) {
              	case -3:
              		/* exception already set */
              		return NULL;
              	case -2:
              		Py_RETURN_NONE;
              	default:
              		return PyInt_FromLong(found);
              	}
              }
              /*
               * sq_contains: "x in index".  Integers are tested against the range
               * [-1, len(index)); anything else is treated as a node and looked up.
               * Returns 1 or 0, or -1 with an exception set.
               */
              static int index_contains(indexObject *self, PyObject *value)
              {
              	char *bin;
              	Py_ssize_t binlen;
              	int found;

              	if (PyInt_Check(value)) {
              		long rev = PyInt_AS_LONG(value);
              		if (rev < -1)
              			return 0;
              		return rev < index_length(self);
              	}

              	if (node_check(value, &bin, &binlen) == -1)
              		return -1;

              	found = index_find_node(self, bin, binlen);
              	if (found == -3)
              		return -1;
              	return found != -2;
              }
              /*
               * Drop from the trie every node contributed by self->added[start:],
               * and release the whole list when start is 0.
               */
              static void nt_invalidate_added(indexObject *self, Py_ssize_t start)
              {
              	const Py_ssize_t total = PyList_GET_SIZE(self->added);
              	Py_ssize_t pos = start;

              	while (pos < total) {
              		PyObject *entry = PyList_GET_ITEM(self->added, pos);
              		/* element 7 of an entry tuple holds the node string */
              		PyObject *nodeobj = PyTuple_GET_ITEM(entry, 7);
              		/* rev -1 makes nt_insert() write an empty slot */
              		nt_insert(self, PyString_AS_STRING(nodeobj), -1);
              		pos++;
              	}

              	if (start == 0)
              		Py_CLEAR(self->added);
              }
              /*
               * Delete a numeric range of revs, which must be at the end of the
               * range, but exclude the sentinel nullid entry.
               *
               * Returns 0 on success and -1 with an exception set on failure.  The
               * cached head revisions are dropped whenever anything is deleted.
               */
              static int index_slice_del(indexObject *self, PyObject *item)
              {
              	Py_ssize_t start, stop, step, slicelength;
              	Py_ssize_t length = index_length(self);
              	int ret = 0;
              	if (PySlice_GetIndicesEx((PySliceObject*)item, length,
              				 &start, &stop, &step, &slicelength) < 0)
              		return -1;
              	/* empty slice: nothing to delete */
              	if (slicelength <= 0)
              		return 0;
              	if ((step < 0 && start < stop) || (step > 0 && start > stop))
              		stop = start;
              	/* rewrite a negative-step slice as the equivalent forward slice */
              	if (step < 0) {
              		stop = start + 1;
              		start = stop + step*(slicelength - 1) - 1;
              		step = -step;
              	}
              	if (step != 1) {
              		PyErr_SetString(PyExc_ValueError,
              				"revlog index delete requires step size of 1");
              		return -1;
              	}
              	/* the slice must end exactly one entry before the end */
              	if (stop != length - 1) {
              		PyErr_SetString(PyExc_IndexError,
              				"revlog index deletion indices are invalid");
              		return -1;
              	}
              	/*
              	 * NOTE(review): self->length presumably excludes the entries in
              	 * self->added while index_length() includes them -- confirm.
              	 * Under that reading this branch truncates below self->length and
              	 * discards every added entry as well.
              	 */
              	if (start < self->length - 1) {
              		if (self->nt) {
              			Py_ssize_t i;
              			/* empty the trie slots of the removed revs */
              			for (i = start + 1; i < self->length - 1; i++) {
              				const char *node = index_node(self, i);
              				if (node)
              					nt_insert(self, node, -1);
              			}
              			if (self->added)
              				nt_invalidate_added(self, 0);
              			if (self->ntrev > start)
              				self->ntrev = (int)start;
              		}
              		self->length = start + 1;
              		if (start < self->raw_length)
              			self->raw_length = start;
              		goto done;
              	}
              	/* otherwise only a tail of self->added is removed */
              	if (self->nt) {
              		nt_invalidate_added(self, start - self->length + 1);
              		if (self->ntrev > start)
              			self->ntrev = (int)start;
              	}
              	if (self->added)
              		ret = PyList_SetSlice(self->added, start - self->length + 1,
              				      PyList_GET_SIZE(self->added), NULL);
              done:
              	Py_CLEAR(self->headrevs);
              	return ret;
              }
              /*
               * Supported ops:
               *
               * slice deletion
               * string assignment (extend node->rev mapping)
               * string deletion (shrink node->rev mapping)
               *
               * Returns 0 on success and -1 with an exception set on failure.
               */
              static int index_assign_subscript(indexObject *self, PyObject *item,
              				  PyObject *value)
              {
              	char *node;
              	Py_ssize_t nodelen;
              	long rev;
              	/* "del index[a:b]" */
              	if (PySlice_Check(item) && value == NULL)
              		return index_slice_del(self, item);
              	if (node_check(item, &node, &nodelen) == -1)
              		return -1;
              	/* "del index[node]": nothing to forget when no tree exists */
              	if (value == NULL)
              		return self->nt ? nt_insert(self, node, -1) : 0;
              	rev = PyInt_AsLong(value);
              	if (rev > INT_MAX || rev < 0) {
              		/* PyInt_AsLong may already have set an exception */
              		if (!PyErr_Occurred())
              			PyErr_SetString(PyExc_ValueError, "rev out of range");
              		return -1;
              	}
              	/*
              	 * nt_insert() dereferences self->nt unconditionally, so the
              	 * tree must exist before the first assignment.
              	 */
              	if (nt_init(self) == -1)
              		return -1;
              	return nt_insert(self, node, (int)rev);
              }
              /*
               * Find all RevlogNG entries in an index that has inline data. Update
               * the optional "offsets" table with those entries.
               *
               * Returns the number of entries found, or -1 with ValueError set when
               * the scan does not stop at a position accepted by the final check.
               * When "offsets" is non-NULL it must have room for every entry; no
               * bounds check is performed here.
               */
              static long inline_scan(indexObject *self, const char **offsets)
              {
              	const char *data = PyString_AS_STRING(self->data);
              	const char *end = data + PyString_GET_SIZE(self->data);
              	long incr = v1_hdrsize;
              	Py_ssize_t len = 0;
              	/* each record is a fixed-size header followed by its inline data */
              	while (data + v1_hdrsize <= end) {
              		uint32_t comp_len;
              		const char *old_data;
              		/* 3rd element of header is length of compressed inline data */
              		comp_len = getbe32(data + 8);
              		incr = v1_hdrsize + comp_len;
              		/* stop if the record size wrapped around */
              		if (incr < v1_hdrsize)
              			break;
              		if (offsets)
              			offsets[len] = data;
              		len++;
              		old_data = data;
              		data += incr;
              		/* stop if the pointer failed to advance */
              		if (data <= old_data)
              			break;
              	}
              	/* accept only a scan that stopped at end, or one header before it */
              	if (data != end && data + v1_hdrsize != end) {
              		if (!PyErr_Occurred())
              			PyErr_SetString(PyExc_ValueError, "corrupt index file");
              		return -1;
              	}
              	return len;
              }
              /*
               * tp_init: initialise an index from the arguments (data, inlined).
               *
               * "data" must be a string holding the raw index; "inlined" is tested
               * for truth and says whether revision data is interleaved with the
               * index records.  Returns 0 on success and -1 with an exception set
               * on failure.
               */
              static int index_init(indexObject *self, PyObject *args)
              {
              	PyObject *data_obj, *inlined_obj;
              	Py_ssize_t size;
              	int inlined;
              	/*
              	 * Initialise every field before any argument checking: the
              	 * object may come from PyObject_New(), which does not zero its
              	 * memory, and index_dealloc() runs on it if we fail below.
              	 */
              	self->raw_length = 0;
              	self->length = 0;
              	self->inlined = 0;
              	self->data = NULL;
              	self->cache = NULL;
              	self->added = NULL;
              	self->headrevs = NULL;
              	self->offsets = NULL;
              	self->nt = NULL;
              	self->ntlength = self->ntcapacity = 0;
              	self->ntdepth = self->ntsplits = 0;
              	self->ntlookups = self->ntmisses = 0;
              	self->ntrev = -1;
              	if (!PyArg_ParseTuple(args, "OO", &data_obj, &inlined_obj))
              		return -1;
              	if (!PyString_Check(data_obj)) {
              		PyErr_SetString(PyExc_TypeError, "data is not a string");
              		return -1;
              	}
              	size = PyString_GET_SIZE(data_obj);
              	/* PyObject_IsTrue() returns -1 on error; do not treat it as true */
              	inlined = inlined_obj ? PyObject_IsTrue(inlined_obj) : 0;
              	if (inlined == -1)
              		return -1;
              	self->inlined = inlined;
              	self->data = data_obj;
              	Py_INCREF(self->data);
              	if (self->inlined) {
              		/* records vary in size, so they have to be counted */
              		long len = inline_scan(self, NULL);
              		if (len == -1)
              			goto bail;
              		self->raw_length = len;
              		self->length = len + 1;
              	} else {
              		/* fixed-size records: the data must divide evenly */
              		if (size % v1_hdrsize) {
              			PyErr_SetString(PyExc_ValueError, "corrupt index file");
              			goto bail;
              		}
              		self->raw_length = size / v1_hdrsize;
              		self->length = self->raw_length + 1;
              	}
              	return 0;
              bail:
              	/* self->data stays owned by self and is released on dealloc */
              	return -1;
              }
              /* Getter for the "nodemap" attribute: the index serves as its own map. */
              static PyObject *index_nodemap(indexObject *self)
              {
              	Py_INCREF(self);
              	return (PyObject *)self;
              }
              /* tp_dealloc: release the caches, the data string and the added list. */
              static void index_dealloc(indexObject *self)
              {
              	_index_clearcaches(self);
              	/* data is NULL when index_init() failed before storing it */
              	Py_XDECREF(self->data);
              	Py_XDECREF(self->added);
              	PyObject_Del(self);
              }
              /*
               * Sequence protocol for the index type: length, item access by
               * position and the "in" operator.  All other slots are unused.
               */
              static PySequenceMethods index_sequence_methods = {
              	(lenfunc)index_length,   /* sq_length */
              	0,                       /* sq_concat */
              	0,                       /* sq_repeat */
              	(ssizeargfunc)index_get, /* sq_item */
              	0,                       /* sq_slice */
              	0,                       /* sq_ass_item */
              	0,                       /* sq_ass_slice */
              	(objobjproc)index_contains, /* sq_contains */
              };
              /*
               * Mapping protocol for the index type: subscript lookup, plus
               * subscript assignment and deletion.
               */
              static PyMappingMethods index_mapping_methods = {
              	(lenfunc)index_length,                 /* mp_length */
              	(binaryfunc)index_getitem,             /* mp_subscript */
              	(objobjargproc)index_assign_subscript, /* mp_ass_subscript */
              };
              /* Python-visible methods of the index type. */
              static PyMethodDef index_methods[] = {
              	{"clearcaches", (PyCFunction)index_clearcaches, METH_NOARGS,
              	 "clear the index caches"},
              	{"get", (PyCFunction)index_m_get, METH_VARARGS,
              	 "get an index entry"},
              	{"headrevs", (PyCFunction)index_headrevs, METH_NOARGS,
              	 "get head revisions"},
              	{"insert", (PyCFunction)index_insert, METH_VARARGS,
              	 "insert an index entry"},
              	{"partialmatch", (PyCFunction)index_partialmatch, METH_VARARGS,
              	 "match a potentially ambiguous node ID"},
              	{"stats", (PyCFunction)index_stats, METH_NOARGS,
              	 "stats for the index"},
              	{NULL} /* Sentinel */
              };
              /* Computed attributes of the index type; "nodemap" is read-only. */
              static PyGetSetDef index_getset[] = {
              	{"nodemap", (getter)index_nodemap, NULL, "nodemap", NULL},
              	{NULL} /* Sentinel */
              };
              static PyTypeObject indexType = {
              	PyObject_HEAD_INIT(NULL)
 ,                         /* ob_size */
              	"parsers.index",           /* tp_name */
              	sizeof(indexObject),       /* tp_basicsize */
 ,                         /* tp_itemsize */
              	(destructor)index_dealloc, /* tp_dealloc */
 ,                         /* tp_print */
 ,                         /* tp_getattr */
 ,                         /* tp_setattr */
 ,                         /* tp_compare */
 ,                         /* tp_repr */
 ,                         /* tp_as_number */
              	&index_sequence_methods,   /* tp_as_sequence */
              	&index_mapping_methods,    /* tp_as_mapping */
 ,                         /* tp_hash */
 ,                         /* tp_call */
 ,                         /* tp_str */
 ,                         /* tp_getattro */
 ,                         /* tp_setattro */
 ,                         /* tp_as_buffer */
              	Py_TPFLAGS_DEFAULT,        /* tp_flags */
              	"revlog index",            /* tp_doc */
 ,                         /* tp_traverse */
 ,                         /* tp_clear */
 ,                         /* tp_richcompare */
 ,                         /* tp_weaklistoffset */
 ,                         /* tp_iter */
 ,                         /* tp_iternext */
              	index_methods,             /* tp_methods */
 ,                         /* tp_members */
              	index_getset,              /* tp_getset */
 ,                         /* tp_base */
 ,                         /* tp_dict */
 ,                         /* tp_descr_get */
 ,                         /* tp_descr_set */
 ,                         /* tp_dictoffset */
              	(initproc)index_init,      /* tp_init */
 ,                         /* tp_alloc */
              };
              /*
               * Build an index object from the (data, inlined) arguments and return
               * a tuple of the form (index, cache) with elements as follows:
               *
               * index: an index object that lazily parses RevlogNG records
               * cache: if data is inlined, a tuple (0, index_file_content), else None
               *
               * added complications are for backwards compatibility
               *
               * Returns NULL with an exception set on failure.
               */
              static PyObject *parse_index2(PyObject *self, PyObject *args)
              {
              	PyObject *tuple = NULL, *cache = NULL;
              	indexObject *idx;
              	int ret;
              	/* PyObject_New() does not zero the new object's fields */
              	idx = PyObject_New(indexObject, &indexType);
              	if (idx == NULL)
              		goto bail;
              	ret = index_init(idx, args);
              	if (ret == -1)
              		goto bail;
              	if (idx->inlined) {
              		/* "O" takes its own reference to idx->data */
              		cache = Py_BuildValue("iO", 0, idx->data);
              		if (cache == NULL)
              			goto bail;
              	} else {
              		cache = Py_None;
              		Py_INCREF(cache);
              	}
              	/* "N" hands our references to idx and cache over to the tuple */
              	tuple = Py_BuildValue("NN", idx, cache);
              	if (!tuple)
              		goto bail;
              	return tuple;
              bail:
              	Py_XDECREF(idx);
              	Py_XDECREF(cache);
              	Py_XDECREF(tuple);
              	return NULL;
              }
              static char parsers_doc[] = "Efficient content parsing.";
              static PyMethodDef methods[] = {
+             	{"pack_dirstate", pack_dirstate, METH_VARARGS, "pack a dirstate\n"},
              	{"parse_manifest", parse_manifest, METH_VARARGS, "parse a manifest\n"},
              	{"parse_dirstate", parse_dirstate, METH_VARARGS, "parse a dirstate\n"},
              	{"parse_index2", parse_index2, METH_VARARGS, "parse a revlog index\n"},
              	{NULL, NULL}
              };
              /*
               * Shared module setup for the Python 2 and Python 3 entry points:
               * registers the index type on the module and builds the module-wide
               * constant tuples.  Returns early, without creating the constants,
               * if the type cannot be readied.
               */
              static void module_init(PyObject *mod)
              {
              	indexType.tp_new = PyType_GenericNew;
              	if (PyType_Ready(&indexType) < 0)
              		return;
              	/* PyModule_AddObject() steals a reference on success */
              	Py_INCREF(&indexType);
              	PyModule_AddObject(mod, "index", (PyObject *)&indexType);
              	nullentry = Py_BuildValue("iiiiiiis#", 0, 0, 0,
              				  -1, -1, -1, -1, nullid, 20);
              	/* nullentry lives for the life of the module; hide it from the GC */
              	if (nullentry)
              		PyObject_GC_UnTrack(nullentry);
              	dirstate_unset = Py_BuildValue("ciii", 'n', 0, -1, -1);
              }
              /*
               * Module entry points.  Python 3 needs a PyModuleDef and returns the
               * module object; Python 2 uses Py_InitModule3() and returns nothing.
               * Both delegate the shared setup to module_init().
               */
              #ifdef IS_PY3K
              static struct PyModuleDef parsers_module = {
              	PyModuleDef_HEAD_INIT,
              	"parsers",
              	parsers_doc,
              	-1,
              	methods
              };
              PyMODINIT_FUNC PyInit_parsers(void)
              {
              	PyObject *mod = PyModule_Create(&parsers_module);
              	module_init(mod);
              	return mod;
              }
              #else
              PyMODINIT_FUNC initparsers(void)
              {
              	PyObject *mod = Py_InitModule3("parsers", methods, parsers_doc);
              	module_init(mod);
              }
              #endif

General Comments 0

Write
Preview

You need to be logged in to leave comments. Login now

No TODOs yet

	Site-wide shortcuts
/	Use quick search box
g h	Goto home page
g g	Goto my private gists page
g G	Goto my public gists page
g 0-9	Goto bookmarked items from 0-9
n r	New repository page
n g	New gist page

	Repositories
g s	Goto summary page
g c	Goto changelog page
g f	Goto files page
g F	Goto files page with file search activated
g p	Goto pull requests page
g o	Goto repository settings
g O	Goto repository access permissions settings
t s	Toggle sidebar on some pages