parsers: inline fields of dirstate values in C version...
Siddharth Agarwal
r21809:e250b830 default
@@ -1,305 +1,292 b'mercurial/dirs.c'
1 1 /*
2 2 dirs.c - dynamic directory diddling for dirstates
3 3
4 4 Copyright 2013 Facebook
5 5
6 6 This software may be used and distributed according to the terms of
7 7 the GNU General Public License, incorporated herein by reference.
8 8 */
9 9
10 10 #define PY_SSIZE_T_CLEAN
11 11 #include <Python.h>
12 12 #include "util.h"
13 13
14 14 /*
15 15 * This is a multiset of directory names, built from the files that
16 16 * appear in a dirstate or manifest.
17 17 *
18 18 * A few implementation notes:
19 19 *
20 20 * We modify Python integers for refcounting, but those integers are
21 21 * never visible to Python code.
22 22 *
23 23 * We mutate strings in-place, but leave them immutable once they can
24 24 * be seen by Python code.
25 25 */
26 26 typedef struct {
27 27 PyObject_HEAD
28 28 PyObject *dict;
29 29 } dirsObject;
30 30
31 31 static inline Py_ssize_t _finddir(PyObject *path, Py_ssize_t pos)
32 32 {
33 33 const char *s = PyString_AS_STRING(path);
34 34
35 35 while (pos != -1) {
36 36 if (s[pos] == '/')
37 37 break;
38 38 pos -= 1;
39 39 }
40 40
41 41 return pos;
42 42 }
43 43
44 44 static int _addpath(PyObject *dirs, PyObject *path)
45 45 {
46 46 const char *cpath = PyString_AS_STRING(path);
47 47 Py_ssize_t pos = PyString_GET_SIZE(path);
48 48 PyObject *key = NULL;
49 49 int ret = -1;
50 50
51 51 while ((pos = _finddir(path, pos - 1)) != -1) {
52 52 PyObject *val;
53 53
54 54 /* It's likely that every prefix already has an entry
55 55 in our dict. Try to avoid allocating and
56 56 deallocating a string for each prefix we check. */
57 57 if (key != NULL)
58 58 ((PyStringObject *)key)->ob_shash = -1;
59 59 else {
60 60 /* Force Python to not reuse a small shared string. */
61 61 key = PyString_FromStringAndSize(cpath,
62 62 pos < 2 ? 2 : pos);
63 63 if (key == NULL)
64 64 goto bail;
65 65 }
66 66 PyString_GET_SIZE(key) = pos;
67 67 PyString_AS_STRING(key)[pos] = '\0';
68 68
69 69 val = PyDict_GetItem(dirs, key);
70 70 if (val != NULL) {
71 71 PyInt_AS_LONG(val) += 1;
72 72 continue;
73 73 }
74 74
75 75 /* Force Python to not reuse a small shared int. */
76 76 val = PyInt_FromLong(0x1eadbeef);
77 77
78 78 if (val == NULL)
79 79 goto bail;
80 80
81 81 PyInt_AS_LONG(val) = 1;
82 82 ret = PyDict_SetItem(dirs, key, val);
83 83 Py_DECREF(val);
84 84 if (ret == -1)
85 85 goto bail;
86 86 Py_CLEAR(key);
87 87 }
88 88 ret = 0;
89 89
90 90 bail:
91 91 Py_XDECREF(key);
92 92
93 93 return ret;
94 94 }
95 95
96 96 static int _delpath(PyObject *dirs, PyObject *path)
97 97 {
98 98 Py_ssize_t pos = PyString_GET_SIZE(path);
99 99 PyObject *key = NULL;
100 100 int ret = -1;
101 101
102 102 while ((pos = _finddir(path, pos - 1)) != -1) {
103 103 PyObject *val;
104 104
105 105 key = PyString_FromStringAndSize(PyString_AS_STRING(path), pos);
106 106
107 107 if (key == NULL)
108 108 goto bail;
109 109
110 110 val = PyDict_GetItem(dirs, key);
111 111 if (val == NULL) {
112 112 PyErr_SetString(PyExc_ValueError,
113 113 "expected a value, found none");
114 114 goto bail;
115 115 }
116 116
117 117 if (--PyInt_AS_LONG(val) <= 0 &&
118 118 PyDict_DelItem(dirs, key) == -1)
119 119 goto bail;
120 120 Py_CLEAR(key);
121 121 }
122 122 ret = 0;
123 123
124 124 bail:
125 125 Py_XDECREF(key);
126 126
127 127 return ret;
128 128 }
129 129
130 130 static int dirs_fromdict(PyObject *dirs, PyObject *source, char skipchar)
131 131 {
132 132 PyObject *key, *value;
133 133 Py_ssize_t pos = 0;
134 134
135 135 while (PyDict_Next(source, &pos, &key, &value)) {
136 136 if (!PyString_Check(key)) {
137 137 PyErr_SetString(PyExc_TypeError, "expected string key");
138 138 return -1;
139 139 }
140 140 if (skipchar) {
141 PyObject *st;
142
143 if (!PyTuple_Check(value) ||
144 PyTuple_GET_SIZE(value) == 0) {
141 if (!dirstate_tuple_check(value)) {
145 142 PyErr_SetString(PyExc_TypeError,
146 "expected non-empty tuple");
143 "expected a dirstate tuple");
147 144 return -1;
148 145 }
149
150 st = PyTuple_GET_ITEM(value, 0);
151
152 if (!PyString_Check(st) || PyString_GET_SIZE(st) == 0) {
153 PyErr_SetString(PyExc_TypeError,
154 "expected non-empty string "
155 "at tuple index 0");
156 return -1;
157 }
158
159 if (PyString_AS_STRING(st)[0] == skipchar)
146 if (((dirstateTupleObject *)value)->state == skipchar)
160 147 continue;
161 148 }
162 149
163 150 if (_addpath(dirs, key) == -1)
164 151 return -1;
165 152 }
166 153
167 154 return 0;
168 155 }
169 156
170 157 static int dirs_fromiter(PyObject *dirs, PyObject *source)
171 158 {
172 159 PyObject *iter, *item = NULL;
173 160 int ret;
174 161
175 162 iter = PyObject_GetIter(source);
176 163 if (iter == NULL)
177 164 return -1;
178 165
179 166 while ((item = PyIter_Next(iter)) != NULL) {
180 167 if (!PyString_Check(item)) {
181 168 PyErr_SetString(PyExc_TypeError, "expected string");
182 169 break;
183 170 }
184 171
185 172 if (_addpath(dirs, item) == -1)
186 173 break;
187 174 Py_CLEAR(item);
188 175 }
189 176
190 177 ret = PyErr_Occurred() ? -1 : 0;
191 178 Py_XDECREF(item);
192 179 return ret;
193 180 }
194 181
195 182 /*
196 183 * Calculate a refcounted set of directory names for the files in a
197 184 * dirstate.
198 185 */
199 186 static int dirs_init(dirsObject *self, PyObject *args)
200 187 {
201 188 PyObject *dirs = NULL, *source = NULL;
202 189 char skipchar = 0;
203 190 int ret = -1;
204 191
205 192 self->dict = NULL;
206 193
207 194 if (!PyArg_ParseTuple(args, "|Oc:__init__", &source, &skipchar))
208 195 return -1;
209 196
210 197 dirs = PyDict_New();
211 198
212 199 if (dirs == NULL)
213 200 return -1;
214 201
215 202 if (source == NULL)
216 203 ret = 0;
217 204 else if (PyDict_Check(source))
218 205 ret = dirs_fromdict(dirs, source, skipchar);
219 206 else if (skipchar)
220 207 PyErr_SetString(PyExc_ValueError,
221 208 "skip character is only supported "
222 209 "with a dict source");
223 210 else
224 211 ret = dirs_fromiter(dirs, source);
225 212
226 213 if (ret == -1)
227 214 Py_XDECREF(dirs);
228 215 else
229 216 self->dict = dirs;
230 217
231 218 return ret;
232 219 }
233 220
234 221 PyObject *dirs_addpath(dirsObject *self, PyObject *args)
235 222 {
236 223 PyObject *path;
237 224
238 225 if (!PyArg_ParseTuple(args, "O!:addpath", &PyString_Type, &path))
239 226 return NULL;
240 227
241 228 if (_addpath(self->dict, path) == -1)
242 229 return NULL;
243 230
244 231 Py_RETURN_NONE;
245 232 }
246 233
247 234 static PyObject *dirs_delpath(dirsObject *self, PyObject *args)
248 235 {
249 236 PyObject *path;
250 237
251 238 if (!PyArg_ParseTuple(args, "O!:delpath", &PyString_Type, &path))
252 239 return NULL;
253 240
254 241 if (_delpath(self->dict, path) == -1)
255 242 return NULL;
256 243
257 244 Py_RETURN_NONE;
258 245 }
259 246
260 247 static int dirs_contains(dirsObject *self, PyObject *value)
261 248 {
262 249 return PyString_Check(value) ? PyDict_Contains(self->dict, value) : 0;
263 250 }
264 251
265 252 static void dirs_dealloc(dirsObject *self)
266 253 {
267 254 Py_XDECREF(self->dict);
268 255 PyObject_Del(self);
269 256 }
270 257
271 258 static PyObject *dirs_iter(dirsObject *self)
272 259 {
273 260 return PyObject_GetIter(self->dict);
274 261 }
275 262
276 263 static PySequenceMethods dirs_sequence_methods;
277 264
278 265 static PyMethodDef dirs_methods[] = {
279 266 {"addpath", (PyCFunction)dirs_addpath, METH_VARARGS, "add a path"},
280 267 {"delpath", (PyCFunction)dirs_delpath, METH_VARARGS, "remove a path"},
281 268 {NULL} /* Sentinel */
282 269 };
283 270
284 271 static PyTypeObject dirsType = { PyObject_HEAD_INIT(NULL) };
285 272
286 273 void dirs_module_init(PyObject *mod)
287 274 {
288 275 dirs_sequence_methods.sq_contains = (objobjproc)dirs_contains;
289 276 dirsType.tp_name = "parsers.dirs";
290 277 dirsType.tp_new = PyType_GenericNew;
291 278 dirsType.tp_basicsize = sizeof(dirsObject);
292 279 dirsType.tp_dealloc = (destructor)dirs_dealloc;
293 280 dirsType.tp_as_sequence = &dirs_sequence_methods;
294 281 dirsType.tp_flags = Py_TPFLAGS_DEFAULT;
295 282 dirsType.tp_doc = "dirs";
296 283 dirsType.tp_iter = (getiterfunc)dirs_iter;
297 284 dirsType.tp_methods = dirs_methods;
298 285 dirsType.tp_init = (initproc)dirs_init;
299 286
300 287 if (PyType_Ready(&dirsType) < 0)
301 288 return;
302 289 Py_INCREF(&dirsType);
303 290
304 291 PyModule_AddObject(mod, "dirs", (PyObject *)&dirsType);
305 292 }
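
The dirs type above is a reference-counted multiset of directory prefixes: _addpath bumps a counter for every parent directory of a path, and _delpath drops a directory once its count falls to zero. A rough pure-Python sketch of those semantics (illustrative names only; the C code additionally recycles key strings and patches int refcounts, as its header comment explains):

    def _finddirs(path):
        # yield every proper directory prefix of path, deepest first,
        # matching the '/' scan done by _finddir() above
        pos = path.rfind('/')
        while pos != -1:
            yield path[:pos]
            pos = path.rfind('/', 0, pos)

    class dirsmultiset(object):
        def __init__(self, paths=()):
            self._dirs = {}
            for p in paths:
                self.addpath(p)

        def addpath(self, path):
            for d in _finddirs(path):
                self._dirs[d] = self._dirs.get(d, 0) + 1

        def delpath(self, path):
            for d in _finddirs(path):
                if self._dirs[d] <= 1:
                    del self._dirs[d]
                else:
                    self._dirs[d] -= 1

        def __contains__(self, d):
            return d in self._dirs

        def __iter__(self):
            return iter(self._dirs)

With the change to dirs_fromdict above, the optional skip character is now compared against the state field of the C dirstate tuple instead of the first element of a plain Python tuple.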
@@ -1,858 +1,856 b'mercurial/dirstate.py'
1 1 # dirstate.py - working directory tracking for mercurial
2 2 #
3 3 # Copyright 2005-2007 Matt Mackall <mpm@selenic.com>
4 4 #
5 5 # This software may be used and distributed according to the terms of the
6 6 # GNU General Public License version 2 or any later version.
7 7
8 8 from node import nullid
9 9 from i18n import _
10 10 import scmutil, util, ignore, osutil, parsers, encoding, pathutil
11 11 import os, stat, errno, gc
12 12
13 13 propertycache = util.propertycache
14 14 filecache = scmutil.filecache
15 15 _rangemask = 0x7fffffff
16 16
17 def dirstatetuple(*x):
18 # x is a tuple
19 return x
17 dirstatetuple = parsers.dirstatetuple
20 18
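
The removed shim simply returned its arguments as a plain Python tuple; parsers.dirstatetuple, defined in parsers.c below, stores the same four fields inline as a char and three C ints, so large dirstates no longer allocate a Python object per field. Call sites keep working because the C type still behaves like a 4-element sequence, for example (illustrative values):

    entry = dirstatetuple('n', 0644, 1024, 1400000000)
    state, mode, size, mtime = entry          # sequence unpacking still works
    assert len(entry) == 4 and entry[0] == 'n'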
21 19 class repocache(filecache):
22 20 """filecache for files in .hg/"""
23 21 def join(self, obj, fname):
24 22 return obj._opener.join(fname)
25 23
26 24 class rootcache(filecache):
27 25 """filecache for files in the repository root"""
28 26 def join(self, obj, fname):
29 27 return obj._join(fname)
30 28
31 29 class dirstate(object):
32 30
33 31 def __init__(self, opener, ui, root, validate):
34 32 '''Create a new dirstate object.
35 33
36 34 opener is an open()-like callable that can be used to open the
37 35 dirstate file; root is the root of the directory tracked by
38 36 the dirstate.
39 37 '''
40 38 self._opener = opener
41 39 self._validate = validate
42 40 self._root = root
43 41 self._rootdir = os.path.join(root, '')
44 42 self._dirty = False
45 43 self._dirtypl = False
46 44 self._lastnormaltime = 0
47 45 self._ui = ui
48 46 self._filecache = {}
49 47
50 48 @propertycache
51 49 def _map(self):
52 50 '''Return the dirstate contents as a map from filename to
53 51 (state, mode, size, time).'''
54 52 self._read()
55 53 return self._map
56 54
57 55 @propertycache
58 56 def _copymap(self):
59 57 self._read()
60 58 return self._copymap
61 59
62 60 @propertycache
63 61 def _foldmap(self):
64 62 f = {}
65 63 for name, s in self._map.iteritems():
66 64 if s[0] != 'r':
67 65 f[util.normcase(name)] = name
68 66 for name in self._dirs:
69 67 f[util.normcase(name)] = name
70 68 f['.'] = '.' # prevents useless util.fspath() invocation
71 69 return f
72 70
73 71 @repocache('branch')
74 72 def _branch(self):
75 73 try:
76 74 return self._opener.read("branch").strip() or "default"
77 75 except IOError, inst:
78 76 if inst.errno != errno.ENOENT:
79 77 raise
80 78 return "default"
81 79
82 80 @propertycache
83 81 def _pl(self):
84 82 try:
85 83 fp = self._opener("dirstate")
86 84 st = fp.read(40)
87 85 fp.close()
88 86 l = len(st)
89 87 if l == 40:
90 88 return st[:20], st[20:40]
91 89 elif l > 0 and l < 40:
92 90 raise util.Abort(_('working directory state appears damaged!'))
93 91 except IOError, err:
94 92 if err.errno != errno.ENOENT:
95 93 raise
96 94 return [nullid, nullid]
97 95
98 96 @propertycache
99 97 def _dirs(self):
100 98 return scmutil.dirs(self._map, 'r')
101 99
102 100 def dirs(self):
103 101 return self._dirs
104 102
105 103 @rootcache('.hgignore')
106 104 def _ignore(self):
107 105 files = [self._join('.hgignore')]
108 106 for name, path in self._ui.configitems("ui"):
109 107 if name == 'ignore' or name.startswith('ignore.'):
110 108 files.append(util.expandpath(path))
111 109 return ignore.ignore(self._root, files, self._ui.warn)
112 110
113 111 @propertycache
114 112 def _slash(self):
115 113 return self._ui.configbool('ui', 'slash') and os.sep != '/'
116 114
117 115 @propertycache
118 116 def _checklink(self):
119 117 return util.checklink(self._root)
120 118
121 119 @propertycache
122 120 def _checkexec(self):
123 121 return util.checkexec(self._root)
124 122
125 123 @propertycache
126 124 def _checkcase(self):
127 125 return not util.checkcase(self._join('.hg'))
128 126
129 127 def _join(self, f):
130 128 # much faster than os.path.join()
131 129 # it's safe because f is always a relative path
132 130 return self._rootdir + f
133 131
134 132 def flagfunc(self, buildfallback):
135 133 if self._checklink and self._checkexec:
136 134 def f(x):
137 135 try:
138 136 st = os.lstat(self._join(x))
139 137 if util.statislink(st):
140 138 return 'l'
141 139 if util.statisexec(st):
142 140 return 'x'
143 141 except OSError:
144 142 pass
145 143 return ''
146 144 return f
147 145
148 146 fallback = buildfallback()
149 147 if self._checklink:
150 148 def f(x):
151 149 if os.path.islink(self._join(x)):
152 150 return 'l'
153 151 if 'x' in fallback(x):
154 152 return 'x'
155 153 return ''
156 154 return f
157 155 if self._checkexec:
158 156 def f(x):
159 157 if 'l' in fallback(x):
160 158 return 'l'
161 159 if util.isexec(self._join(x)):
162 160 return 'x'
163 161 return ''
164 162 return f
165 163 else:
166 164 return fallback
167 165
168 166 @propertycache
169 167 def _cwd(self):
170 168 return os.getcwd()
171 169
172 170 def getcwd(self):
173 171 cwd = self._cwd
174 172 if cwd == self._root:
175 173 return ''
176 174 # self._root ends with a path separator if self._root is '/' or 'C:\'
177 175 rootsep = self._root
178 176 if not util.endswithsep(rootsep):
179 177 rootsep += os.sep
180 178 if cwd.startswith(rootsep):
181 179 return cwd[len(rootsep):]
182 180 else:
183 181 # we're outside the repo. return an absolute path.
184 182 return cwd
185 183
186 184 def pathto(self, f, cwd=None):
187 185 if cwd is None:
188 186 cwd = self.getcwd()
189 187 path = util.pathto(self._root, cwd, f)
190 188 if self._slash:
191 189 return util.pconvert(path)
192 190 return path
193 191
194 192 def __getitem__(self, key):
195 193 '''Return the current state of key (a filename) in the dirstate.
196 194
197 195 States are:
198 196 n normal
199 197 m needs merging
200 198 r marked for removal
201 199 a marked for addition
202 200 ? not tracked
203 201 '''
204 202 return self._map.get(key, ("?",))[0]
205 203
206 204 def __contains__(self, key):
207 205 return key in self._map
208 206
209 207 def __iter__(self):
210 208 for x in sorted(self._map):
211 209 yield x
212 210
213 211 def iteritems(self):
214 212 return self._map.iteritems()
215 213
216 214 def parents(self):
217 215 return [self._validate(p) for p in self._pl]
218 216
219 217 def p1(self):
220 218 return self._validate(self._pl[0])
221 219
222 220 def p2(self):
223 221 return self._validate(self._pl[1])
224 222
225 223 def branch(self):
226 224 return encoding.tolocal(self._branch)
227 225
228 226 def setparents(self, p1, p2=nullid):
229 227 """Set dirstate parents to p1 and p2.
230 228
231 229 When moving from two parents to one, 'm' merged entries are
232 230 adjusted to normal and the previous copy records are discarded
233 231 and returned by the call.
234 232
235 233 See localrepo.setparents()
236 234 """
237 235 self._dirty = self._dirtypl = True
238 236 oldp2 = self._pl[1]
239 237 self._pl = p1, p2
240 238 copies = {}
241 239 if oldp2 != nullid and p2 == nullid:
242 240 # Discard 'm' markers when moving away from a merge state
243 241 for f, s in self._map.iteritems():
244 242 if s[0] == 'm':
245 243 if f in self._copymap:
246 244 copies[f] = self._copymap[f]
247 245 self.normallookup(f)
248 246 return copies
249 247
250 248 def setbranch(self, branch):
251 249 self._branch = encoding.fromlocal(branch)
252 250 f = self._opener('branch', 'w', atomictemp=True)
253 251 try:
254 252 f.write(self._branch + '\n')
255 253 f.close()
256 254
257 255 # make sure filecache has the correct stat info for _branch after
258 256 # replacing the underlying file
259 257 ce = self._filecache['_branch']
260 258 if ce:
261 259 ce.refresh()
262 260 except: # re-raises
263 261 f.discard()
264 262 raise
265 263
266 264 def _read(self):
267 265 self._map = {}
268 266 self._copymap = {}
269 267 try:
270 268 st = self._opener.read("dirstate")
271 269 except IOError, err:
272 270 if err.errno != errno.ENOENT:
273 271 raise
274 272 return
275 273 if not st:
276 274 return
277 275
278 276 # Python's garbage collector triggers a GC each time a certain number
279 277 # of container objects (the number being defined by
280 278 # gc.get_threshold()) are allocated. parse_dirstate creates a tuple
281 279 # for each file in the dirstate. The C version then immediately marks
282 280 # them as not to be tracked by the collector. However, this has no
283 281 # effect on when GCs are triggered, only on what objects the GC looks
284 282 # into. This means that O(number of files) GCs are unavoidable.
285 283 # Depending on when in the process's lifetime the dirstate is parsed,
286 284 # this can get very expensive. As a workaround, disable GC while
287 285 # parsing the dirstate.
288 286 gcenabled = gc.isenabled()
289 287 gc.disable()
290 288 try:
291 289 p = parsers.parse_dirstate(self._map, self._copymap, st)
292 290 finally:
293 291 if gcenabled:
294 292 gc.enable()
295 293 if not self._dirtypl:
296 294 self._pl = p
297 295
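
The guard around parse_dirstate above can be pictured as a small context manager; this is only a sketch of the same isenabled/disable/enable dance, not code used by dirstate itself:

    import gc
    from contextlib import contextmanager

    @contextmanager
    def gcdisabled():
        # only re-enable the collector if it was enabled to begin with
        enabled = gc.isenabled()
        gc.disable()
        try:
            yield
        finally:
            if enabled:
                gc.enable()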
298 296 def invalidate(self):
299 297 for a in ("_map", "_copymap", "_foldmap", "_branch", "_pl", "_dirs",
300 298 "_ignore"):
301 299 if a in self.__dict__:
302 300 delattr(self, a)
303 301 self._lastnormaltime = 0
304 302 self._dirty = False
305 303
306 304 def copy(self, source, dest):
307 305 """Mark dest as a copy of source. Unmark dest if source is None."""
308 306 if source == dest:
309 307 return
310 308 self._dirty = True
311 309 if source is not None:
312 310 self._copymap[dest] = source
313 311 elif dest in self._copymap:
314 312 del self._copymap[dest]
315 313
316 314 def copied(self, file):
317 315 return self._copymap.get(file, None)
318 316
319 317 def copies(self):
320 318 return self._copymap
321 319
322 320 def _droppath(self, f):
323 321 if self[f] not in "?r" and "_dirs" in self.__dict__:
324 322 self._dirs.delpath(f)
325 323
326 324 def _addpath(self, f, state, mode, size, mtime):
327 325 oldstate = self[f]
328 326 if state == 'a' or oldstate == 'r':
329 327 scmutil.checkfilename(f)
330 328 if f in self._dirs:
331 329 raise util.Abort(_('directory %r already in dirstate') % f)
332 330 # shadows
333 331 for d in scmutil.finddirs(f):
334 332 if d in self._dirs:
335 333 break
336 334 if d in self._map and self[d] != 'r':
337 335 raise util.Abort(
338 336 _('file %r in dirstate clashes with %r') % (d, f))
339 337 if oldstate in "?r" and "_dirs" in self.__dict__:
340 338 self._dirs.addpath(f)
341 339 self._dirty = True
342 340 self._map[f] = dirstatetuple(state, mode, size, mtime)
343 341
344 342 def normal(self, f):
345 343 '''Mark a file normal and clean.'''
346 344 s = os.lstat(self._join(f))
347 345 mtime = int(s.st_mtime)
348 346 self._addpath(f, 'n', s.st_mode,
349 347 s.st_size & _rangemask, mtime & _rangemask)
350 348 if f in self._copymap:
351 349 del self._copymap[f]
352 350 if mtime > self._lastnormaltime:
353 351 # Remember the most recent modification timeslot for status(),
354 352 # to make sure we won't miss future size-preserving file content
355 353 # modifications that happen within the same timeslot.
356 354 self._lastnormaltime = mtime
357 355
358 356 def normallookup(self, f):
359 357 '''Mark a file normal, but possibly dirty.'''
360 358 if self._pl[1] != nullid and f in self._map:
361 359 # if there is a merge going on and the file was either
362 360 # in state 'm' (-1) or coming from other parent (-2) before
363 361 # being removed, restore that state.
364 362 entry = self._map[f]
365 363 if entry[0] == 'r' and entry[2] in (-1, -2):
366 364 source = self._copymap.get(f)
367 365 if entry[2] == -1:
368 366 self.merge(f)
369 367 elif entry[2] == -2:
370 368 self.otherparent(f)
371 369 if source:
372 370 self.copy(source, f)
373 371 return
374 372 if entry[0] == 'm' or entry[0] == 'n' and entry[2] == -2:
375 373 return
376 374 self._addpath(f, 'n', 0, -1, -1)
377 375 if f in self._copymap:
378 376 del self._copymap[f]
379 377
380 378 def otherparent(self, f):
381 379 '''Mark as coming from the other parent, always dirty.'''
382 380 if self._pl[1] == nullid:
383 381 raise util.Abort(_("setting %r to other parent "
384 382 "only allowed in merges") % f)
385 383 self._addpath(f, 'n', 0, -2, -1)
386 384 if f in self._copymap:
387 385 del self._copymap[f]
388 386
389 387 def add(self, f):
390 388 '''Mark a file added.'''
391 389 self._addpath(f, 'a', 0, -1, -1)
392 390 if f in self._copymap:
393 391 del self._copymap[f]
394 392
395 393 def remove(self, f):
396 394 '''Mark a file removed.'''
397 395 self._dirty = True
398 396 self._droppath(f)
399 397 size = 0
400 398 if self._pl[1] != nullid and f in self._map:
401 399 # backup the previous state
402 400 entry = self._map[f]
403 401 if entry[0] == 'm': # merge
404 402 size = -1
405 403 elif entry[0] == 'n' and entry[2] == -2: # other parent
406 404 size = -2
407 405 self._map[f] = dirstatetuple('r', 0, size, 0)
408 406 if size == 0 and f in self._copymap:
409 407 del self._copymap[f]
410 408
411 409 def merge(self, f):
412 410 '''Mark a file merged.'''
413 411 if self._pl[1] == nullid:
414 412 return self.normallookup(f)
415 413 s = os.lstat(self._join(f))
416 414 self._addpath(f, 'm', s.st_mode,
417 415 s.st_size & _rangemask, int(s.st_mtime) & _rangemask)
418 416 if f in self._copymap:
419 417 del self._copymap[f]
420 418
421 419 def drop(self, f):
422 420 '''Drop a file from the dirstate'''
423 421 if f in self._map:
424 422 self._dirty = True
425 423 self._droppath(f)
426 424 del self._map[f]
427 425
428 426 def _normalize(self, path, isknown, ignoremissing=False, exists=None):
429 427 normed = util.normcase(path)
430 428 folded = self._foldmap.get(normed, None)
431 429 if folded is None:
432 430 if isknown:
433 431 folded = path
434 432 else:
435 433 if exists is None:
436 434 exists = os.path.lexists(os.path.join(self._root, path))
437 435 if not exists:
438 436 # Maybe a path component exists
439 437 if not ignoremissing and '/' in path:
440 438 d, f = path.rsplit('/', 1)
441 439 d = self._normalize(d, isknown, ignoremissing, None)
442 440 folded = d + "/" + f
443 441 else:
444 442 # No path components, preserve original case
445 443 folded = path
446 444 else:
447 445 # recursively normalize leading directory components
448 446 # against dirstate
449 447 if '/' in normed:
450 448 d, f = normed.rsplit('/', 1)
451 449 d = self._normalize(d, isknown, ignoremissing, True)
452 450 r = self._root + "/" + d
453 451 folded = d + "/" + util.fspath(f, r)
454 452 else:
455 453 folded = util.fspath(normed, self._root)
456 454 self._foldmap[normed] = folded
457 455
458 456 return folded
459 457
460 458 def normalize(self, path, isknown=False, ignoremissing=False):
461 459 '''
462 460 normalize the case of a pathname when on a casefolding filesystem
463 461
464 462 isknown specifies whether the filename came from walking the
465 463 disk, to avoid extra filesystem access.
466 464
467 465 If ignoremissing is True, missing paths are returned
468 466 unchanged. Otherwise, we try harder to normalize possibly
469 467 existing path components.
470 468
471 469 The normalized case is determined based on the following precedence:
472 470
473 471 - version of name already stored in the dirstate
474 472 - version of name stored on disk
475 473 - version provided via command arguments
476 474 '''
477 475
478 476 if self._checkcase:
479 477 return self._normalize(path, isknown, ignoremissing)
480 478 return path
481 479
482 480 def clear(self):
483 481 self._map = {}
484 482 if "_dirs" in self.__dict__:
485 483 delattr(self, "_dirs")
486 484 self._copymap = {}
487 485 self._pl = [nullid, nullid]
488 486 self._lastnormaltime = 0
489 487 self._dirty = True
490 488
491 489 def rebuild(self, parent, allfiles, changedfiles=None):
492 490 changedfiles = changedfiles or allfiles
493 491 oldmap = self._map
494 492 self.clear()
495 493 for f in allfiles:
496 494 if f not in changedfiles:
497 495 self._map[f] = oldmap[f]
498 496 else:
499 497 if 'x' in allfiles.flags(f):
500 498 self._map[f] = dirstatetuple('n', 0777, -1, 0)
501 499 else:
502 500 self._map[f] = dirstatetuple('n', 0666, -1, 0)
503 501 self._pl = (parent, nullid)
504 502 self._dirty = True
505 503
506 504 def write(self):
507 505 if not self._dirty:
508 506 return
509 507 st = self._opener("dirstate", "w", atomictemp=True)
510 508 # use the modification time of the newly created temporary file as the
511 509 # filesystem's notion of 'now'
512 510 now = util.fstat(st).st_mtime
513 511 st.write(parsers.pack_dirstate(self._map, self._copymap, self._pl, now))
514 512 st.close()
515 513 self._lastnormaltime = 0
516 514 self._dirty = self._dirtypl = False
517 515
518 516 def _dirignore(self, f):
519 517 if f == '.':
520 518 return False
521 519 if self._ignore(f):
522 520 return True
523 521 for p in scmutil.finddirs(f):
524 522 if self._ignore(p):
525 523 return True
526 524 return False
527 525
528 526 def _walkexplicit(self, match, subrepos):
529 527 '''Get stat data about the files explicitly specified by match.
530 528
531 529 Return a triple (results, dirsfound, dirsnotfound).
532 530 - results is a mapping from filename to stat result. It also contains
533 531 listings mapping subrepos and .hg to None.
534 532 - dirsfound is a list of files found to be directories.
535 533 - dirsnotfound is a list of files that the dirstate thinks are
536 534 directories and that were not found.'''
537 535
538 536 def badtype(mode):
539 537 kind = _('unknown')
540 538 if stat.S_ISCHR(mode):
541 539 kind = _('character device')
542 540 elif stat.S_ISBLK(mode):
543 541 kind = _('block device')
544 542 elif stat.S_ISFIFO(mode):
545 543 kind = _('fifo')
546 544 elif stat.S_ISSOCK(mode):
547 545 kind = _('socket')
548 546 elif stat.S_ISDIR(mode):
549 547 kind = _('directory')
550 548 return _('unsupported file type (type is %s)') % kind
551 549
552 550 matchedir = match.explicitdir
553 551 badfn = match.bad
554 552 dmap = self._map
555 553 normpath = util.normpath
556 554 lstat = os.lstat
557 555 getkind = stat.S_IFMT
558 556 dirkind = stat.S_IFDIR
559 557 regkind = stat.S_IFREG
560 558 lnkkind = stat.S_IFLNK
561 559 join = self._join
562 560 dirsfound = []
563 561 foundadd = dirsfound.append
564 562 dirsnotfound = []
565 563 notfoundadd = dirsnotfound.append
566 564
567 565 if match.matchfn != match.exact and self._checkcase:
568 566 normalize = self._normalize
569 567 else:
570 568 normalize = None
571 569
572 570 files = sorted(match.files())
573 571 subrepos.sort()
574 572 i, j = 0, 0
575 573 while i < len(files) and j < len(subrepos):
576 574 subpath = subrepos[j] + "/"
577 575 if files[i] < subpath:
578 576 i += 1
579 577 continue
580 578 while i < len(files) and files[i].startswith(subpath):
581 579 del files[i]
582 580 j += 1
583 581
584 582 if not files or '.' in files:
585 583 files = ['']
586 584 results = dict.fromkeys(subrepos)
587 585 results['.hg'] = None
588 586
589 587 for ff in files:
590 588 if normalize:
591 589 nf = normalize(normpath(ff), False, True)
592 590 else:
593 591 nf = normpath(ff)
594 592 if nf in results:
595 593 continue
596 594
597 595 try:
598 596 st = lstat(join(nf))
599 597 kind = getkind(st.st_mode)
600 598 if kind == dirkind:
601 599 if nf in dmap:
602 600 # file replaced by dir on disk but still in dirstate
603 601 results[nf] = None
604 602 if matchedir:
605 603 matchedir(nf)
606 604 foundadd(nf)
607 605 elif kind == regkind or kind == lnkkind:
608 606 results[nf] = st
609 607 else:
610 608 badfn(ff, badtype(kind))
611 609 if nf in dmap:
612 610 results[nf] = None
613 611 except OSError, inst: # nf not found on disk - it is dirstate only
614 612 if nf in dmap: # does it exactly match a missing file?
615 613 results[nf] = None
616 614 else: # does it match a missing directory?
617 615 prefix = nf + "/"
618 616 for fn in dmap:
619 617 if fn.startswith(prefix):
620 618 if matchedir:
621 619 matchedir(nf)
622 620 notfoundadd(nf)
623 621 break
624 622 else:
625 623 badfn(ff, inst.strerror)
626 624
627 625 return results, dirsfound, dirsnotfound
628 626
629 627 def walk(self, match, subrepos, unknown, ignored, full=True):
630 628 '''
631 629 Walk recursively through the directory tree, finding all files
632 630 matched by match.
633 631
634 632 If full is False, maybe skip some known-clean files.
635 633
636 634 Return a dict mapping filename to stat-like object (either
637 635 mercurial.osutil.stat instance or return value of os.stat()).
638 636
639 637 '''
640 638 # full is a flag that extensions that hook into walk can use -- this
641 639 # implementation doesn't use it at all. This satisfies the contract
642 640 # because we only guarantee a "maybe".
643 641
644 642 if ignored:
645 643 ignore = util.never
646 644 dirignore = util.never
647 645 elif unknown:
648 646 ignore = self._ignore
649 647 dirignore = self._dirignore
650 648 else:
651 649 # if not unknown and not ignored, drop dir recursion and step 2
652 650 ignore = util.always
653 651 dirignore = util.always
654 652
655 653 matchfn = match.matchfn
656 654 matchalways = match.always()
657 655 matchtdir = match.traversedir
658 656 dmap = self._map
659 657 listdir = osutil.listdir
660 658 lstat = os.lstat
661 659 dirkind = stat.S_IFDIR
662 660 regkind = stat.S_IFREG
663 661 lnkkind = stat.S_IFLNK
664 662 join = self._join
665 663
666 664 exact = skipstep3 = False
667 665 if matchfn == match.exact: # match.exact
668 666 exact = True
669 667 dirignore = util.always # skip step 2
670 668 elif match.files() and not match.anypats(): # match.match, no patterns
671 669 skipstep3 = True
672 670
673 671 if not exact and self._checkcase:
674 672 normalize = self._normalize
675 673 skipstep3 = False
676 674 else:
677 675 normalize = None
678 676
679 677 # step 1: find all explicit files
680 678 results, work, dirsnotfound = self._walkexplicit(match, subrepos)
681 679
682 680 skipstep3 = skipstep3 and not (work or dirsnotfound)
683 681 work = [d for d in work if not dirignore(d)]
684 682 wadd = work.append
685 683
686 684 # step 2: visit subdirectories
687 685 while work:
688 686 nd = work.pop()
689 687 skip = None
690 688 if nd == '.':
691 689 nd = ''
692 690 else:
693 691 skip = '.hg'
694 692 try:
695 693 entries = listdir(join(nd), stat=True, skip=skip)
696 694 except OSError, inst:
697 695 if inst.errno in (errno.EACCES, errno.ENOENT):
698 696 match.bad(self.pathto(nd), inst.strerror)
699 697 continue
700 698 raise
701 699 for f, kind, st in entries:
702 700 if normalize:
703 701 nf = normalize(nd and (nd + "/" + f) or f, True, True)
704 702 else:
705 703 nf = nd and (nd + "/" + f) or f
706 704 if nf not in results:
707 705 if kind == dirkind:
708 706 if not ignore(nf):
709 707 if matchtdir:
710 708 matchtdir(nf)
711 709 wadd(nf)
712 710 if nf in dmap and (matchalways or matchfn(nf)):
713 711 results[nf] = None
714 712 elif kind == regkind or kind == lnkkind:
715 713 if nf in dmap:
716 714 if matchalways or matchfn(nf):
717 715 results[nf] = st
718 716 elif (matchalways or matchfn(nf)) and not ignore(nf):
719 717 results[nf] = st
720 718 elif nf in dmap and (matchalways or matchfn(nf)):
721 719 results[nf] = None
722 720
723 721 for s in subrepos:
724 722 del results[s]
725 723 del results['.hg']
726 724
727 725 # step 3: visit remaining files from dmap
728 726 if not skipstep3 and not exact:
729 727 # If a dmap file is not in results yet, it was either
730 728 # a) not matching matchfn b) ignored, c) missing, or d) under a
731 729 # symlink directory.
732 730 if not results and matchalways:
733 731 visit = dmap.keys()
734 732 else:
735 733 visit = [f for f in dmap if f not in results and matchfn(f)]
736 734 visit.sort()
737 735
738 736 if unknown:
739 737 # unknown == True means we walked all dirs under the roots
740 738 # that weren't ignored, and everything that matched was stat'ed
741 739 # and is already in results.
742 740 # The rest must thus be ignored or under a symlink.
743 741 audit_path = pathutil.pathauditor(self._root)
744 742
745 743 for nf in iter(visit):
746 744 # Report ignored items in the dmap as long as they are not
747 745 # under a symlink directory.
748 746 if audit_path.check(nf):
749 747 try:
750 748 results[nf] = lstat(join(nf))
751 749 # file was just ignored, no links, and exists
752 750 except OSError:
753 751 # file doesn't exist
754 752 results[nf] = None
755 753 else:
756 754 # It's either missing or under a symlink directory
757 755 # which we in this case report as missing
758 756 results[nf] = None
759 757 else:
760 758 # We may not have walked the full directory tree above,
761 759 # so stat and check everything we missed.
762 760 nf = iter(visit).next
763 761 for st in util.statfiles([join(i) for i in visit]):
764 762 results[nf()] = st
765 763 return results
766 764
767 765 def status(self, match, subrepos, ignored, clean, unknown):
768 766 '''Determine the status of the working copy relative to the
769 767 dirstate and return a tuple of lists (unsure, modified, added,
770 768 removed, deleted, unknown, ignored, clean), where:
771 769
772 770 unsure:
773 771 files that might have been modified since the dirstate was
774 772 written, but need to be read to be sure (size is the same
775 773 but mtime differs)
776 774 modified:
777 775 files that have definitely been modified since the dirstate
778 776 was written (different size or mode)
779 777 added:
780 778 files that have been explicitly added with hg add
781 779 removed:
782 780 files that have been explicitly removed with hg remove
783 781 deleted:
784 782 files that have been deleted through other means ("missing")
785 783 unknown:
786 784 files not in the dirstate that are not ignored
787 785 ignored:
788 786 files not in the dirstate that are ignored
789 787 (by _dirignore())
790 788 clean:
791 789 files that have definitely not been modified since the
792 790 dirstate was written
793 791 '''
794 792 listignored, listclean, listunknown = ignored, clean, unknown
795 793 lookup, modified, added, unknown, ignored = [], [], [], [], []
796 794 removed, deleted, clean = [], [], []
797 795
798 796 dmap = self._map
799 797 ladd = lookup.append # aka "unsure"
800 798 madd = modified.append
801 799 aadd = added.append
802 800 uadd = unknown.append
803 801 iadd = ignored.append
804 802 radd = removed.append
805 803 dadd = deleted.append
806 804 cadd = clean.append
807 805 mexact = match.exact
808 806 dirignore = self._dirignore
809 807 checkexec = self._checkexec
810 808 copymap = self._copymap
811 809 lastnormaltime = self._lastnormaltime
812 810
813 811 # We need to do full walks when either
814 812 # - we're listing all clean files, or
815 813 # - match.traversedir does something, because match.traversedir should
816 814 # be called for every dir in the working dir
817 815 full = listclean or match.traversedir is not None
818 816 for fn, st in self.walk(match, subrepos, listunknown, listignored,
819 817 full=full).iteritems():
820 818 if fn not in dmap:
821 819 if (listignored or mexact(fn)) and dirignore(fn):
822 820 if listignored:
823 821 iadd(fn)
824 822 else:
825 823 uadd(fn)
826 824 continue
827 825
828 826 state, mode, size, time = dmap[fn]
829 827
830 828 if not st and state in "nma":
831 829 dadd(fn)
832 830 elif state == 'n':
833 831 mtime = int(st.st_mtime)
834 832 if (size >= 0 and
835 833 ((size != st.st_size and size != st.st_size & _rangemask)
836 834 or ((mode ^ st.st_mode) & 0100 and checkexec))
837 835 or size == -2 # other parent
838 836 or fn in copymap):
839 837 madd(fn)
840 838 elif time != mtime and time != mtime & _rangemask:
841 839 ladd(fn)
842 840 elif mtime == lastnormaltime:
843 841 # fn may have been changed in the same timeslot without
844 842 # changing its size. This can happen if we quickly do
845 843 # multiple commits in a single transaction.
846 844 # Force lookup, so we don't miss such a racy file change.
847 845 ladd(fn)
848 846 elif listclean:
849 847 cadd(fn)
850 848 elif state == 'm':
851 849 madd(fn)
852 850 elif state == 'a':
853 851 aadd(fn)
854 852 elif state == 'r':
855 853 radd(fn)
856 854
857 855 return (lookup, modified, added, removed, deleted, unknown, ignored,
858 856 clean)
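
For the state == 'n' branch of status() above, the choice between "modified", "lookup" (unsure) and "clean" comes down to the size/mode/mtime comparisons; this is a sketch restating the same logic under an illustrative helper name, not a separate code path:

    _rangemask = 0x7fffffff

    def _classifynormal(mode, size, time, st, lastnormaltime, checkexec, copied):
        mtime = int(st.st_mtime)
        if (size >= 0 and
            ((size != st.st_size and size != st.st_size & _rangemask)
             or ((mode ^ st.st_mode) & 0100 and checkexec))
            or size == -2                     # entry came from the other parent
            or copied):
            return 'modified'
        if time != mtime and time != mtime & _rangemask:
            return 'lookup'                   # same size, different mtime: read it
        if mtime == lastnormaltime:
            return 'lookup'                   # racy timeslot, force a content check
        return 'clean'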
@@ -1,2083 +1,2197 b'mercurial/parsers.c'
1 1 /*
2 2 parsers.c - efficient content parsing
3 3
4 4 Copyright 2008 Matt Mackall <mpm@selenic.com> and others
5 5
6 6 This software may be used and distributed according to the terms of
7 7 the GNU General Public License, incorporated herein by reference.
8 8 */
9 9
10 10 #include <Python.h>
11 11 #include <ctype.h>
12 12 #include <stddef.h>
13 13 #include <string.h>
14 14
15 15 #include "util.h"
16 16
17 17 static char *versionerrortext = "Python minor version mismatch";
18 18
19 19 static int8_t hextable[256] = {
20 20 -1, -1, -1, -1, -1, -1, -1, -1, -1, -1, -1, -1, -1, -1, -1, -1,
21 21 -1, -1, -1, -1, -1, -1, -1, -1, -1, -1, -1, -1, -1, -1, -1, -1,
22 22 -1, -1, -1, -1, -1, -1, -1, -1, -1, -1, -1, -1, -1, -1, -1, -1,
23 23 0, 1, 2, 3, 4, 5, 6, 7, 8, 9, -1, -1, -1, -1, -1, -1, /* 0-9 */
24 24 -1, 10, 11, 12, 13, 14, 15, -1, -1, -1, -1, -1, -1, -1, -1, -1, /* A-F */
25 25 -1, -1, -1, -1, -1, -1, -1, -1, -1, -1, -1, -1, -1, -1, -1, -1,
26 26 -1, 10, 11, 12, 13, 14, 15, -1, -1, -1, -1, -1, -1, -1, -1, -1, /* a-f */
27 27 -1, -1, -1, -1, -1, -1, -1, -1, -1, -1, -1, -1, -1, -1, -1, -1,
28 28 -1, -1, -1, -1, -1, -1, -1, -1, -1, -1, -1, -1, -1, -1, -1, -1,
29 29 -1, -1, -1, -1, -1, -1, -1, -1, -1, -1, -1, -1, -1, -1, -1, -1,
30 30 -1, -1, -1, -1, -1, -1, -1, -1, -1, -1, -1, -1, -1, -1, -1, -1,
31 31 -1, -1, -1, -1, -1, -1, -1, -1, -1, -1, -1, -1, -1, -1, -1, -1,
32 32 -1, -1, -1, -1, -1, -1, -1, -1, -1, -1, -1, -1, -1, -1, -1, -1,
33 33 -1, -1, -1, -1, -1, -1, -1, -1, -1, -1, -1, -1, -1, -1, -1, -1,
34 34 -1, -1, -1, -1, -1, -1, -1, -1, -1, -1, -1, -1, -1, -1, -1, -1,
35 35 -1, -1, -1, -1, -1, -1, -1, -1, -1, -1, -1, -1, -1, -1, -1, -1
36 36 };
37 37
38 38 static inline int hexdigit(const char *p, Py_ssize_t off)
39 39 {
40 40 int8_t val = hextable[(unsigned char)p[off]];
41 41
42 42 if (val >= 0) {
43 43 return val;
44 44 }
45 45
46 46 PyErr_SetString(PyExc_ValueError, "input contains non-hex character");
47 47 return 0;
48 48 }
49 49
50 50 /*
51 51 * Turn a hex-encoded string into binary.
52 52 */
53 53 static PyObject *unhexlify(const char *str, int len)
54 54 {
55 55 PyObject *ret;
56 56 char *d;
57 57 int i;
58 58
59 59 ret = PyBytes_FromStringAndSize(NULL, len / 2);
60 60
61 61 if (!ret)
62 62 return NULL;
63 63
64 64 d = PyBytes_AsString(ret);
65 65
66 66 for (i = 0; i < len;) {
67 67 int hi = hexdigit(str, i++);
68 68 int lo = hexdigit(str, i++);
69 69 *d++ = (hi << 4) | lo;
70 70 }
71 71
72 72 return ret;
73 73 }
74 74
75 75 /*
76 76 * This code assumes that a manifest is stitched together with newline
77 77 * ('\n') characters.
78 78 */
79 79 static PyObject *parse_manifest(PyObject *self, PyObject *args)
80 80 {
81 81 PyObject *mfdict, *fdict;
82 82 char *str, *start, *end;
83 83 int len;
84 84
85 85 if (!PyArg_ParseTuple(args, "O!O!s#:parse_manifest",
86 86 &PyDict_Type, &mfdict,
87 87 &PyDict_Type, &fdict,
88 88 &str, &len))
89 89 goto quit;
90 90
91 91 start = str;
92 92 end = str + len;
93 93 while (start < end) {
94 94 PyObject *file = NULL, *node = NULL;
95 95 PyObject *flags = NULL;
96 96 char *zero = NULL, *newline = NULL;
97 97 ptrdiff_t nlen;
98 98
99 99 zero = memchr(start, '\0', end - start);
100 100 if (!zero) {
101 101 PyErr_SetString(PyExc_ValueError,
102 102 "manifest entry has no separator");
103 103 goto quit;
104 104 }
105 105
106 106 newline = memchr(zero + 1, '\n', end - (zero + 1));
107 107 if (!newline) {
108 108 PyErr_SetString(PyExc_ValueError,
109 109 "manifest contains trailing garbage");
110 110 goto quit;
111 111 }
112 112
113 113 file = PyBytes_FromStringAndSize(start, zero - start);
114 114
115 115 if (!file)
116 116 goto bail;
117 117
118 118 nlen = newline - zero - 1;
119 119
120 120 node = unhexlify(zero + 1, nlen > 40 ? 40 : (int)nlen);
121 121 if (!node)
122 122 goto bail;
123 123
124 124 if (nlen > 40) {
125 125 flags = PyBytes_FromStringAndSize(zero + 41,
126 126 nlen - 40);
127 127 if (!flags)
128 128 goto bail;
129 129
130 130 if (PyDict_SetItem(fdict, file, flags) == -1)
131 131 goto bail;
132 132 }
133 133
134 134 if (PyDict_SetItem(mfdict, file, node) == -1)
135 135 goto bail;
136 136
137 137 start = newline + 1;
138 138
139 139 Py_XDECREF(flags);
140 140 Py_XDECREF(node);
141 141 Py_XDECREF(file);
142 142 continue;
143 143 bail:
144 144 Py_XDECREF(flags);
145 145 Py_XDECREF(node);
146 146 Py_XDECREF(file);
147 147 goto quit;
148 148 }
149 149
150 150 Py_INCREF(Py_None);
151 151 return Py_None;
152 152 quit:
153 153 return NULL;
154 154 }
155 155
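
parse_manifest above expects each entry to be "<filename>\0<40 hex chars>[flags]\n". A pure-Python sketch of the same parse (illustrative function name):

    import binascii

    def parsemanifest(data, mfdict, fdict):
        for line in data.splitlines():
            fname, rest = line.split('\0', 1)
            mfdict[fname] = binascii.unhexlify(rest[:40])
            if len(rest) > 40:
                fdict[fname] = rest[40:]      # flag characters after the node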
156 static inline dirstateTupleObject *make_dirstate_tuple(char state, int mode,
157 int size, int mtime)
158 {
159 dirstateTupleObject *t = PyObject_New(dirstateTupleObject,
160 &dirstateTupleType);
161 if (!t)
162 return NULL;
163 t->state = state;
164 t->mode = mode;
165 t->size = size;
166 t->mtime = mtime;
167 return t;
168 }
169
170 static PyObject *dirstate_tuple_new(PyTypeObject *subtype, PyObject *args,
171 PyObject *kwds)
172 {
173 /* We do all the initialization here and not a tp_init function because
174 * dirstate_tuple is immutable. */
175 dirstateTupleObject *t;
176 char state;
177 int size, mode, mtime;
178 if (!PyArg_ParseTuple(args, "ciii", &state, &mode, &size, &mtime))
179 return NULL;
180
181 t = (dirstateTupleObject *)subtype->tp_alloc(subtype, 1);
182 if (!t)
183 return NULL;
184 t->state = state;
185 t->mode = mode;
186 t->size = size;
187 t->mtime = mtime;
188
189 return (PyObject *)t;
190 }
191
192 static void dirstate_tuple_dealloc(PyObject *o)
193 {
194 PyObject_Del(o);
195 }
196
197 static Py_ssize_t dirstate_tuple_length(PyObject *o)
198 {
199 return 4;
200 }
201
202 static PyObject *dirstate_tuple_item(PyObject *o, Py_ssize_t i)
203 {
204 dirstateTupleObject *t = (dirstateTupleObject *)o;
205 switch (i) {
206 case 0:
207 return PyBytes_FromStringAndSize(&t->state, 1);
208 case 1:
209 return PyInt_FromLong(t->mode);
210 case 2:
211 return PyInt_FromLong(t->size);
212 case 3:
213 return PyInt_FromLong(t->mtime);
214 default:
215 PyErr_SetString(PyExc_IndexError, "index out of range");
216 return NULL;
217 }
218 }
219
220 static PySequenceMethods dirstate_tuple_sq = {
221 dirstate_tuple_length, /* sq_length */
222 0, /* sq_concat */
223 0, /* sq_repeat */
224 dirstate_tuple_item, /* sq_item */
225 0, /* sq_ass_item */
226 0, /* sq_contains */
227 0, /* sq_inplace_concat */
228 0 /* sq_inplace_repeat */
229 };
230
231 PyTypeObject dirstateTupleType = {
232 PyVarObject_HEAD_INIT(NULL, 0)
233 "dirstate_tuple", /* tp_name */
234 sizeof(dirstateTupleObject),/* tp_basicsize */
235 0, /* tp_itemsize */
236 (destructor)dirstate_tuple_dealloc, /* tp_dealloc */
237 0, /* tp_print */
238 0, /* tp_getattr */
239 0, /* tp_setattr */
240 0, /* tp_compare */
241 0, /* tp_repr */
242 0, /* tp_as_number */
243 &dirstate_tuple_sq, /* tp_as_sequence */
244 0, /* tp_as_mapping */
245 0, /* tp_hash */
246 0, /* tp_call */
247 0, /* tp_str */
248 0, /* tp_getattro */
249 0, /* tp_setattro */
250 0, /* tp_as_buffer */
251 Py_TPFLAGS_DEFAULT, /* tp_flags */
252 "dirstate tuple", /* tp_doc */
253 0, /* tp_traverse */
254 0, /* tp_clear */
255 0, /* tp_richcompare */
256 0, /* tp_weaklistoffset */
257 0, /* tp_iter */
258 0, /* tp_iternext */
259 0, /* tp_methods */
260 0, /* tp_members */
261 0, /* tp_getset */
262 0, /* tp_base */
263 0, /* tp_dict */
264 0, /* tp_descr_get */
265 0, /* tp_descr_set */
266 0, /* tp_dictoffset */
267 0, /* tp_init */
268 0, /* tp_alloc */
269 dirstate_tuple_new, /* tp_new */
270 };
271
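
Taken together, the type above gives Python a small immutable record: it is built from (state, mode, size, mtime), reports a length of 4, supports indices 0-3, and raises IndexError otherwise. For illustration, assuming the extension is importable as mercurial.parsers:

    from mercurial import parsers

    t = parsers.dirstatetuple('n', 0644, 7, 0)
    assert len(t) == 4
    assert (t[0], t[1], t[2], t[3]) == ('n', 0644, 7, 0)
    try:
        t[4]
    except IndexError:
        pass    # dirstate_tuple_item() rejects indices outside 0..3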
156 272 static PyObject *parse_dirstate(PyObject *self, PyObject *args)
157 273 {
158 274 PyObject *dmap, *cmap, *parents = NULL, *ret = NULL;
159 275 PyObject *fname = NULL, *cname = NULL, *entry = NULL;
160 276 char state, *cur, *str, *cpos;
161 277 int mode, size, mtime;
162 278 unsigned int flen;
163 279 int len, pos = 40;
164 280
165 281 if (!PyArg_ParseTuple(args, "O!O!s#:parse_dirstate",
166 282 &PyDict_Type, &dmap,
167 283 &PyDict_Type, &cmap,
168 284 &str, &len))
169 285 goto quit;
170 286
171 287 /* read parents */
172 288 if (len < 40)
173 289 goto quit;
174 290
175 291 parents = Py_BuildValue("s#s#", str, 20, str + 20, 20);
176 292 if (!parents)
177 293 goto quit;
178 294
179 295 /* read filenames */
180 296 while (pos >= 40 && pos < len) {
181 297 cur = str + pos;
182 298 /* unpack header */
183 299 state = *cur;
184 300 mode = getbe32(cur + 1);
185 301 size = getbe32(cur + 5);
186 302 mtime = getbe32(cur + 9);
187 303 flen = getbe32(cur + 13);
188 304 pos += 17;
189 305 cur += 17;
190 306 if (flen > len - pos) {
191 307 PyErr_SetString(PyExc_ValueError, "overflow in dirstate");
192 308 goto quit;
193 309 }
194 310
195 entry = Py_BuildValue("ciii", state, mode, size, mtime);
196 if (!entry)
197 goto quit;
198 PyObject_GC_UnTrack(entry); /* don't waste time with this */
199
311 entry = (PyObject *)make_dirstate_tuple(state, mode, size,
312 mtime);
200 313 cpos = memchr(cur, 0, flen);
201 314 if (cpos) {
202 315 fname = PyBytes_FromStringAndSize(cur, cpos - cur);
203 316 cname = PyBytes_FromStringAndSize(cpos + 1,
204 317 flen - (cpos - cur) - 1);
205 318 if (!fname || !cname ||
206 319 PyDict_SetItem(cmap, fname, cname) == -1 ||
207 320 PyDict_SetItem(dmap, fname, entry) == -1)
208 321 goto quit;
209 322 Py_DECREF(cname);
210 323 } else {
211 324 fname = PyBytes_FromStringAndSize(cur, flen);
212 325 if (!fname ||
213 326 PyDict_SetItem(dmap, fname, entry) == -1)
214 327 goto quit;
215 328 }
216 329 Py_DECREF(fname);
217 330 Py_DECREF(entry);
218 331 fname = cname = entry = NULL;
219 332 pos += flen;
220 333 }
221 334
222 335 ret = parents;
223 336 Py_INCREF(ret);
224 337 quit:
225 338 Py_XDECREF(fname);
226 339 Py_XDECREF(cname);
227 340 Py_XDECREF(entry);
228 341 Py_XDECREF(parents);
229 342 return ret;
230 343 }
231 344
232 345 static inline int getintat(PyObject *tuple, int off, uint32_t *v)
233 346 {
234 347 PyObject *o = PyTuple_GET_ITEM(tuple, off);
235 348 long val;
236 349
237 350 if (PyInt_Check(o))
238 351 val = PyInt_AS_LONG(o);
239 352 else if (PyLong_Check(o)) {
240 353 val = PyLong_AsLong(o);
241 354 if (val == -1 && PyErr_Occurred())
242 355 return -1;
243 356 } else {
244 357 PyErr_SetString(PyExc_TypeError, "expected an int or long");
245 358 return -1;
246 359 }
247 360 if (LONG_MAX > INT_MAX && (val > INT_MAX || val < INT_MIN)) {
248 361 PyErr_SetString(PyExc_OverflowError,
249 362 "Python value to large to convert to uint32_t");
250 363 return -1;
251 364 }
252 365 *v = (uint32_t)val;
253 366 return 0;
254 367 }
255 368
256 369 /*
257 370 * Efficiently pack a dirstate object into its on-disk format.
258 371 */
259 372 static PyObject *pack_dirstate(PyObject *self, PyObject *args)
260 373 {
261 374 PyObject *packobj = NULL;
262 375 PyObject *map, *copymap, *pl, *mtime_unset = NULL;
263 376 Py_ssize_t nbytes, pos, l;
264 377 PyObject *k, *v, *pn;
265 378 char *p, *s;
266 379 double now;
267 380
268 381 if (!PyArg_ParseTuple(args, "O!O!Od:pack_dirstate",
269 382 &PyDict_Type, &map, &PyDict_Type, &copymap,
270 383 &pl, &now))
271 384 return NULL;
272 385
273 386 if (!PySequence_Check(pl) || PySequence_Size(pl) != 2) {
274 387 PyErr_SetString(PyExc_TypeError, "expected 2-element sequence");
275 388 return NULL;
276 389 }
277 390
278 391 /* Figure out how much we need to allocate. */
279 392 for (nbytes = 40, pos = 0; PyDict_Next(map, &pos, &k, &v);) {
280 393 PyObject *c;
281 394 if (!PyString_Check(k)) {
282 395 PyErr_SetString(PyExc_TypeError, "expected string key");
283 396 goto bail;
284 397 }
285 398 nbytes += PyString_GET_SIZE(k) + 17;
286 399 c = PyDict_GetItem(copymap, k);
287 400 if (c) {
288 401 if (!PyString_Check(c)) {
289 402 PyErr_SetString(PyExc_TypeError,
290 403 "expected string key");
291 404 goto bail;
292 405 }
293 406 nbytes += PyString_GET_SIZE(c) + 1;
294 407 }
295 408 }
296 409
297 410 packobj = PyString_FromStringAndSize(NULL, nbytes);
298 411 if (packobj == NULL)
299 412 goto bail;
300 413
301 414 p = PyString_AS_STRING(packobj);
302 415
303 416 pn = PySequence_ITEM(pl, 0);
304 417 if (PyString_AsStringAndSize(pn, &s, &l) == -1 || l != 20) {
305 418 PyErr_SetString(PyExc_TypeError, "expected a 20-byte hash");
306 419 goto bail;
307 420 }
308 421 memcpy(p, s, l);
309 422 p += 20;
310 423 pn = PySequence_ITEM(pl, 1);
311 424 if (PyString_AsStringAndSize(pn, &s, &l) == -1 || l != 20) {
312 425 PyErr_SetString(PyExc_TypeError, "expected a 20-byte hash");
313 426 goto bail;
314 427 }
315 428 memcpy(p, s, l);
316 429 p += 20;
317 430
318 431 for (pos = 0; PyDict_Next(map, &pos, &k, &v); ) {
432 dirstateTupleObject *tuple;
433 char state;
319 434 uint32_t mode, size, mtime;
320 435 Py_ssize_t len, l;
321 436 PyObject *o;
322 char *s, *t;
437 char *t;
323 438
324 if (!PyTuple_Check(v) || PyTuple_GET_SIZE(v) != 4) {
325 PyErr_SetString(PyExc_TypeError, "expected a 4-tuple");
439 if (!dirstate_tuple_check(v)) {
440 PyErr_SetString(PyExc_TypeError,
441 "expected a dirstate tuple");
326 442 goto bail;
327 443 }
328 o = PyTuple_GET_ITEM(v, 0);
329 if (PyString_AsStringAndSize(o, &s, &l) == -1 || l != 1) {
330 PyErr_SetString(PyExc_TypeError, "expected one byte");
331 goto bail;
332 }
333 *p++ = *s;
334 if (getintat(v, 1, &mode) == -1)
335 goto bail;
336 if (getintat(v, 2, &size) == -1)
337 goto bail;
338 if (getintat(v, 3, &mtime) == -1)
339 goto bail;
340 if (*s == 'n' && mtime == (uint32_t)now) {
444 tuple = (dirstateTupleObject *)v;
445
446 state = tuple->state;
447 mode = tuple->mode;
448 size = tuple->size;
449 mtime = tuple->mtime;
450 if (state == 'n' && mtime == (uint32_t)now) {
341 451 /* See pure/parsers.py:pack_dirstate for why we do
342 452 * this. */
343 453 mtime = -1;
344 mtime_unset = Py_BuildValue(
345 "ciii", *s, mode, size, mtime);
454 mtime_unset = (PyObject *)make_dirstate_tuple(
455 state, mode, size, mtime);
346 456 if (!mtime_unset)
347 457 goto bail;
348 458 if (PyDict_SetItem(map, k, mtime_unset) == -1)
349 459 goto bail;
350 460 Py_DECREF(mtime_unset);
351 461 mtime_unset = NULL;
352 462 }
463 *p++ = state;
353 464 putbe32(mode, p);
354 465 putbe32(size, p + 4);
355 466 putbe32(mtime, p + 8);
356 467 t = p + 12;
357 468 p += 16;
358 469 len = PyString_GET_SIZE(k);
359 470 memcpy(p, PyString_AS_STRING(k), len);
360 471 p += len;
361 472 o = PyDict_GetItem(copymap, k);
362 473 if (o) {
363 474 *p++ = '\0';
364 475 l = PyString_GET_SIZE(o);
365 476 memcpy(p, PyString_AS_STRING(o), l);
366 477 p += l;
367 478 len += l + 1;
368 479 }
369 480 putbe32((uint32_t)len, t);
370 481 }
371 482
372 483 pos = p - PyString_AS_STRING(packobj);
373 484 if (pos != nbytes) {
374 485 PyErr_Format(PyExc_SystemError, "bad dirstate size: %ld != %ld",
375 486 (long)pos, (long)nbytes);
376 487 goto bail;
377 488 }
378 489
379 490 return packobj;
380 491 bail:
381 492 Py_XDECREF(mtime_unset);
382 493 Py_XDECREF(packobj);
383 494 return NULL;
384 495 }
385 496
386 497 /*
387 498 * A base-16 trie for fast node->rev mapping.
388 499 *
389 500 * Positive value is index of the next node in the trie
390 501 * Negative value is a leaf: -(rev + 1)
391 502 * Zero is empty
392 503 */
393 504 typedef struct {
394 505 int children[16];
395 506 } nodetree;
396 507
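
A sketch of the lookup this encoding supports (illustrative name; the real nt_find/nt_insert code also handles prefix collisions and populates the trie lazily):

    def nt_lookup(nodes, hexnode):
        # nodes is a list of 16-slot arrays; per the comment above:
        # 0 = empty, > 0 = index of the child node, < 0 = leaf -(rev + 1)
        v = 0                       # start at the root node
        for c in hexnode:
            v = nodes[v][int(c, 16)]
            if v == 0:
                return None         # not present
            if v < 0:
                return -(v + 1)     # decode the revision from the leaf
        return None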
397 508 /*
398 509 * This class has two behaviours.
399 510 *
400 511 * When used in a list-like way (with integer keys), we decode an
401 512 * entry in a RevlogNG index file on demand. Our last entry is a
402 513 * sentinel, always a nullid. We have limited support for
403 514 * integer-keyed insert and delete, only at elements right before the
404 515 * sentinel.
405 516 *
406 517 * With string keys, we lazily perform a reverse mapping from node to
407 518 * rev, using a base-16 trie.
408 519 */
409 520 typedef struct {
410 521 PyObject_HEAD
411 522 /* Type-specific fields go here. */
412 523 PyObject *data; /* raw bytes of index */
413 524 PyObject **cache; /* cached tuples */
414 525 const char **offsets; /* populated on demand */
415 526 Py_ssize_t raw_length; /* original number of elements */
416 527 Py_ssize_t length; /* current number of elements */
417 528 PyObject *added; /* populated on demand */
418 529 PyObject *headrevs; /* cache, invalidated on changes */
419 530 nodetree *nt; /* base-16 trie */
420 531 int ntlength; /* # nodes in use */
421 532 int ntcapacity; /* # nodes allocated */
422 533 int ntdepth; /* maximum depth of tree */
423 534 int ntsplits; /* # splits performed */
424 535 int ntrev; /* last rev scanned */
425 536 int ntlookups; /* # lookups */
426 537 int ntmisses; /* # lookups that miss the cache */
427 538 int inlined;
428 539 } indexObject;
429 540
430 541 static Py_ssize_t index_length(const indexObject *self)
431 542 {
432 543 if (self->added == NULL)
433 544 return self->length;
434 545 return self->length + PyList_GET_SIZE(self->added);
435 546 }
436 547
437 548 static PyObject *nullentry;
438 549 static const char nullid[20];
439 550
440 551 static long inline_scan(indexObject *self, const char **offsets);
441 552
442 553 #if LONG_MAX == 0x7fffffffL
443 554 static char *tuple_format = "Kiiiiiis#";
444 555 #else
445 556 static char *tuple_format = "kiiiiiis#";
446 557 #endif
447 558
448 559 /* A RevlogNG v1 index entry is 64 bytes long. */
449 560 static const long v1_hdrsize = 64;
450 561
451 562 /*
452 563 * Return a pointer to the beginning of a RevlogNG record.
453 564 */
454 565 static const char *index_deref(indexObject *self, Py_ssize_t pos)
455 566 {
456 567 if (self->inlined && pos > 0) {
457 568 if (self->offsets == NULL) {
458 569 self->offsets = malloc(self->raw_length *
459 570 sizeof(*self->offsets));
460 571 if (self->offsets == NULL)
461 572 return (const char *)PyErr_NoMemory();
462 573 inline_scan(self, self->offsets);
463 574 }
464 575 return self->offsets[pos];
465 576 }
466 577
467 578 return PyString_AS_STRING(self->data) + pos * v1_hdrsize;
468 579 }
469 580
470 581 /*
471 582 * RevlogNG format (all in big endian, data may be inlined):
472 583 * 6 bytes: offset
473 584 * 2 bytes: flags
474 585 * 4 bytes: compressed length
475 586 * 4 bytes: uncompressed length
476 587 * 4 bytes: base revision
477 588 * 4 bytes: link revision
478 589 * 4 bytes: parent 1 revision
479 590 * 4 bytes: parent 2 revision
480 591 * 32 bytes: nodeid (only 20 bytes used)
481 592 */
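
Equivalently, one 64-byte entry can be unpacked in Python; this is a sketch under the layout just described, where the first 8 bytes hold the 6-byte offset and 2-byte flags together and the last 12 bytes of the node field are unused padding:

    import struct

    def parseindexentry(data):
        offset_flags, comp, uncomp, base, link, p1, p2, node = \
            struct.unpack(">Qiiiiii20s", data[:52])
        return (offset_flags >> 16, offset_flags & 0xffff,
                comp, uncomp, base, link, p1, p2, node)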
482 593 static PyObject *index_get(indexObject *self, Py_ssize_t pos)
483 594 {
484 595 uint64_t offset_flags;
485 596 int comp_len, uncomp_len, base_rev, link_rev, parent_1, parent_2;
486 597 const char *c_node_id;
487 598 const char *data;
488 599 Py_ssize_t length = index_length(self);
489 600 PyObject *entry;
490 601
491 602 if (pos < 0)
492 603 pos += length;
493 604
494 605 if (pos < 0 || pos >= length) {
495 606 PyErr_SetString(PyExc_IndexError, "revlog index out of range");
496 607 return NULL;
497 608 }
498 609
499 610 if (pos == length - 1) {
500 611 Py_INCREF(nullentry);
501 612 return nullentry;
502 613 }
503 614
504 615 if (pos >= self->length - 1) {
505 616 PyObject *obj;
506 617 obj = PyList_GET_ITEM(self->added, pos - self->length + 1);
507 618 Py_INCREF(obj);
508 619 return obj;
509 620 }
510 621
511 622 if (self->cache) {
512 623 if (self->cache[pos]) {
513 624 Py_INCREF(self->cache[pos]);
514 625 return self->cache[pos];
515 626 }
516 627 } else {
517 628 self->cache = calloc(self->raw_length, sizeof(PyObject *));
518 629 if (self->cache == NULL)
519 630 return PyErr_NoMemory();
520 631 }
521 632
522 633 data = index_deref(self, pos);
523 634 if (data == NULL)
524 635 return NULL;
525 636
526 637 offset_flags = getbe32(data + 4);
527 638 if (pos == 0) /* mask out version number for the first entry */
528 639 offset_flags &= 0xFFFF;
529 640 else {
530 641 uint32_t offset_high = getbe32(data);
531 642 offset_flags |= ((uint64_t)offset_high) << 32;
532 643 }
533 644
534 645 comp_len = getbe32(data + 8);
535 646 uncomp_len = getbe32(data + 12);
536 647 base_rev = getbe32(data + 16);
537 648 link_rev = getbe32(data + 20);
538 649 parent_1 = getbe32(data + 24);
539 650 parent_2 = getbe32(data + 28);
540 651 c_node_id = data + 32;
541 652
542 653 entry = Py_BuildValue(tuple_format, offset_flags, comp_len,
543 654 uncomp_len, base_rev, link_rev,
544 655 parent_1, parent_2, c_node_id, 20);
545 656
546 657 if (entry) {
547 658 PyObject_GC_UnTrack(entry);
548 659 Py_INCREF(entry);
549 660 }
550 661
551 662 self->cache[pos] = entry;
552 663
553 664 return entry;
554 665 }
555 666
556 667 /*
557 668 * Return the 20-byte SHA of the node corresponding to the given rev.
558 669 */
559 670 static const char *index_node(indexObject *self, Py_ssize_t pos)
560 671 {
561 672 Py_ssize_t length = index_length(self);
562 673 const char *data;
563 674
564 675 if (pos == length - 1 || pos == INT_MAX)
565 676 return nullid;
566 677
567 678 if (pos >= length)
568 679 return NULL;
569 680
570 681 if (pos >= self->length - 1) {
571 682 PyObject *tuple, *str;
572 683 tuple = PyList_GET_ITEM(self->added, pos - self->length + 1);
573 684 str = PyTuple_GetItem(tuple, 7);
574 685 return str ? PyString_AS_STRING(str) : NULL;
575 686 }
576 687
577 688 data = index_deref(self, pos);
578 689 return data ? data + 32 : NULL;
579 690 }
580 691
581 692 static int nt_insert(indexObject *self, const char *node, int rev);
582 693
583 694 static int node_check(PyObject *obj, char **node, Py_ssize_t *nodelen)
584 695 {
585 696 if (PyString_AsStringAndSize(obj, node, nodelen) == -1)
586 697 return -1;
587 698 if (*nodelen == 20)
588 699 return 0;
589 700 PyErr_SetString(PyExc_ValueError, "20-byte hash required");
590 701 return -1;
591 702 }
592 703
593 704 static PyObject *index_insert(indexObject *self, PyObject *args)
594 705 {
595 706 PyObject *obj;
596 707 char *node;
597 708 long offset;
598 709 Py_ssize_t len, nodelen;
599 710
600 711 if (!PyArg_ParseTuple(args, "lO", &offset, &obj))
601 712 return NULL;
602 713
603 714 if (!PyTuple_Check(obj) || PyTuple_GET_SIZE(obj) != 8) {
604 715 PyErr_SetString(PyExc_TypeError, "8-tuple required");
605 716 return NULL;
606 717 }
607 718
608 719 if (node_check(PyTuple_GET_ITEM(obj, 7), &node, &nodelen) == -1)
609 720 return NULL;
610 721
611 722 len = index_length(self);
612 723
613 724 if (offset < 0)
614 725 offset += len;
615 726
616 727 if (offset != len - 1) {
617 728 PyErr_SetString(PyExc_IndexError,
618 729 "insert only supported at index -1");
619 730 return NULL;
620 731 }
621 732
622 733 if (offset > INT_MAX) {
623 734 PyErr_SetString(PyExc_ValueError,
624 735 "currently only 2**31 revs supported");
625 736 return NULL;
626 737 }
627 738
628 739 if (self->added == NULL) {
629 740 self->added = PyList_New(0);
630 741 if (self->added == NULL)
631 742 return NULL;
632 743 }
633 744
634 745 if (PyList_Append(self->added, obj) == -1)
635 746 return NULL;
636 747
637 748 if (self->nt)
638 749 nt_insert(self, node, (int)offset);
639 750
640 751 Py_CLEAR(self->headrevs);
641 752 Py_RETURN_NONE;
642 753 }
643 754
644 755 static void _index_clearcaches(indexObject *self)
645 756 {
646 757 if (self->cache) {
647 758 Py_ssize_t i;
648 759
649 760 for (i = 0; i < self->raw_length; i++)
650 761 Py_CLEAR(self->cache[i]);
651 762 free(self->cache);
652 763 self->cache = NULL;
653 764 }
654 765 if (self->offsets) {
655 766 free(self->offsets);
656 767 self->offsets = NULL;
657 768 }
658 769 if (self->nt) {
659 770 free(self->nt);
660 771 self->nt = NULL;
661 772 }
662 773 Py_CLEAR(self->headrevs);
663 774 }
664 775
665 776 static PyObject *index_clearcaches(indexObject *self)
666 777 {
667 778 _index_clearcaches(self);
668 779 self->ntlength = self->ntcapacity = 0;
669 780 self->ntdepth = self->ntsplits = 0;
670 781 self->ntrev = -1;
671 782 self->ntlookups = self->ntmisses = 0;
672 783 Py_RETURN_NONE;
673 784 }
674 785
675 786 static PyObject *index_stats(indexObject *self)
676 787 {
677 788 PyObject *obj = PyDict_New();
678 789
679 790 if (obj == NULL)
680 791 return NULL;
681 792
682 793 #define istat(__n, __d) \
683 794 if (PyDict_SetItemString(obj, __d, PyInt_FromSsize_t(self->__n)) == -1) \
684 795 goto bail;
685 796
686 797 if (self->added) {
687 798 Py_ssize_t len = PyList_GET_SIZE(self->added);
688 799 if (PyDict_SetItemString(obj, "index entries added",
689 800 PyInt_FromSsize_t(len)) == -1)
690 801 goto bail;
691 802 }
692 803
693 804 if (self->raw_length != self->length - 1)
694 805 istat(raw_length, "revs on disk");
695 806 istat(length, "revs in memory");
696 807 istat(ntcapacity, "node trie capacity");
697 808 istat(ntdepth, "node trie depth");
698 809 istat(ntlength, "node trie count");
699 810 istat(ntlookups, "node trie lookups");
700 811 istat(ntmisses, "node trie misses");
701 812 istat(ntrev, "node trie last rev scanned");
702 813 istat(ntsplits, "node trie splits");
703 814
704 815 #undef istat
705 816
706 817 return obj;
707 818
708 819 bail:
709 820 Py_XDECREF(obj);
710 821 return NULL;
711 822 }
712 823
713 824 /*
714 825 * When we cache a list, we want to be sure the caller can't mutate
715 826 * the cached copy.
716 827 */
717 828 static PyObject *list_copy(PyObject *list)
718 829 {
719 830 Py_ssize_t len = PyList_GET_SIZE(list);
720 831 PyObject *newlist = PyList_New(len);
721 832 Py_ssize_t i;
722 833
723 834 if (newlist == NULL)
724 835 return NULL;
725 836
726 837 for (i = 0; i < len; i++) {
727 838 PyObject *obj = PyList_GET_ITEM(list, i);
728 839 Py_INCREF(obj);
729 840 PyList_SET_ITEM(newlist, i, obj);
730 841 }
731 842
732 843 return newlist;
733 844 }
734 845
735 846 static PyObject *index_headrevs(indexObject *self)
736 847 {
737 848 Py_ssize_t i, len, addlen;
738 849 char *nothead = NULL;
739 850 PyObject *heads;
740 851
741 852 if (self->headrevs)
742 853 return list_copy(self->headrevs);
743 854
744 855 len = index_length(self) - 1;
745 856 heads = PyList_New(0);
746 857 if (heads == NULL)
747 858 goto bail;
748 859 if (len == 0) {
749 860 PyObject *nullid = PyInt_FromLong(-1);
750 861 if (nullid == NULL || PyList_Append(heads, nullid) == -1) {
751 862 Py_XDECREF(nullid);
752 863 goto bail;
753 864 }
754 865 goto done;
755 866 }
756 867
757 868 nothead = calloc(len, 1);
758 869 if (nothead == NULL)
759 870 goto bail;
760 871
761 872 for (i = 0; i < self->raw_length; i++) {
762 873 const char *data = index_deref(self, i);
763 874 int parent_1 = getbe32(data + 24);
764 875 int parent_2 = getbe32(data + 28);
765 876 if (parent_1 >= 0)
766 877 nothead[parent_1] = 1;
767 878 if (parent_2 >= 0)
768 879 nothead[parent_2] = 1;
769 880 }
770 881
771 882 addlen = self->added ? PyList_GET_SIZE(self->added) : 0;
772 883
773 884 for (i = 0; i < addlen; i++) {
774 885 PyObject *rev = PyList_GET_ITEM(self->added, i);
775 886 PyObject *p1 = PyTuple_GET_ITEM(rev, 5);
776 887 PyObject *p2 = PyTuple_GET_ITEM(rev, 6);
777 888 long parent_1, parent_2;
778 889
779 890 if (!PyInt_Check(p1) || !PyInt_Check(p2)) {
780 891 PyErr_SetString(PyExc_TypeError,
781 892 "revlog parents are invalid");
782 893 goto bail;
783 894 }
784 895 parent_1 = PyInt_AS_LONG(p1);
785 896 parent_2 = PyInt_AS_LONG(p2);
786 897 if (parent_1 >= 0)
787 898 nothead[parent_1] = 1;
788 899 if (parent_2 >= 0)
789 900 nothead[parent_2] = 1;
790 901 }
791 902
792 903 for (i = 0; i < len; i++) {
793 904 PyObject *head;
794 905
795 906 if (nothead[i])
796 907 continue;
797 908 head = PyInt_FromLong(i);
798 909 if (head == NULL || PyList_Append(heads, head) == -1) {
799 910 Py_XDECREF(head);
800 911 goto bail;
801 912 }
802 913 }
803 914
804 915 done:
805 916 self->headrevs = heads;
806 917 free(nothead);
807 918 return list_copy(self->headrevs);
808 919 bail:
809 920 Py_XDECREF(heads);
810 921 free(nothead);
811 922 return NULL;
812 923 }
813 924
814 925 static inline int nt_level(const char *node, Py_ssize_t level)
815 926 {
816 927 int v = node[level>>1];
817 928 if (!(level & 1))
818 929 v >>= 4;
819 930 return v & 0xf;
820 931 }
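
/*
 * Illustrative sketch (not in the original patch): nt_level() reads one
 * hex nibble per level, high nibble first, so a node whose first byte is
 * 0xab yields 0xa at level 0 and 0xb at level 1.
 */
static int example_nt_level_check(void)
{
        const char node[1] = { (char)0xab };

        return nt_level(node, 0) == 0xa && nt_level(node, 1) == 0xb;
}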
821 932
822 933 /*
823 934 * Return values:
824 935 *
825 936 * -4: match is ambiguous (multiple candidates)
826 937 * -2: not found
827 938 * rest: valid rev
828 939 */
829 940 static int nt_find(indexObject *self, const char *node, Py_ssize_t nodelen,
830 941 int hex)
831 942 {
832 943 int (*getnybble)(const char *, Py_ssize_t) = hex ? hexdigit : nt_level;
833 944 int level, maxlevel, off;
834 945
835 946 if (nodelen == 20 && node[0] == '\0' && memcmp(node, nullid, 20) == 0)
836 947 return -1;
837 948
838 949 if (self->nt == NULL)
839 950 return -2;
840 951
841 952 if (hex)
842 953 maxlevel = nodelen > 40 ? 40 : (int)nodelen;
843 954 else
844 955 maxlevel = nodelen > 20 ? 40 : ((int)nodelen * 2);
845 956
846 957 for (level = off = 0; level < maxlevel; level++) {
847 958 int k = getnybble(node, level);
848 959 nodetree *n = &self->nt[off];
849 960 int v = n->children[k];
850 961
851 962 if (v < 0) {
852 963 const char *n;
853 964 Py_ssize_t i;
854 965
855 966 v = -v - 1;
856 967 n = index_node(self, v);
857 968 if (n == NULL)
858 969 return -2;
859 970 for (i = level; i < maxlevel; i++)
860 971 if (getnybble(node, i) != nt_level(n, i))
861 972 return -2;
862 973 return v;
863 974 }
864 975 if (v == 0)
865 976 return -2;
866 977 off = v;
867 978 }
868 979 /* multiple matches against an ambiguous prefix */
869 980 return -4;
870 981 }
871 982
872 983 static int nt_new(indexObject *self)
873 984 {
874 985 if (self->ntlength == self->ntcapacity) {
875 986 self->ntcapacity *= 2;
876 987 self->nt = realloc(self->nt,
877 988 self->ntcapacity * sizeof(nodetree));
878 989 if (self->nt == NULL) {
879 990 PyErr_SetString(PyExc_MemoryError, "out of memory");
880 991 return -1;
881 992 }
882 993 memset(&self->nt[self->ntlength], 0,
883 994 sizeof(nodetree) * (self->ntcapacity - self->ntlength));
884 995 }
885 996 return self->ntlength++;
886 997 }
887 998
888 999 static int nt_insert(indexObject *self, const char *node, int rev)
889 1000 {
890 1001 int level = 0;
891 1002 int off = 0;
892 1003
893 1004 while (level < 40) {
894 1005 int k = nt_level(node, level);
895 1006 nodetree *n;
896 1007 int v;
897 1008
898 1009 n = &self->nt[off];
899 1010 v = n->children[k];
900 1011
901 1012 if (v == 0) {
902 1013 n->children[k] = -rev - 1;
903 1014 return 0;
904 1015 }
905 1016 if (v < 0) {
906 1017 const char *oldnode = index_node(self, -v - 1);
907 1018 int noff;
908 1019
909 1020 if (!oldnode || !memcmp(oldnode, node, 20)) {
910 1021 n->children[k] = -rev - 1;
911 1022 return 0;
912 1023 }
913 1024 noff = nt_new(self);
914 1025 if (noff == -1)
915 1026 return -1;
916 1027 /* self->nt may have been changed by realloc */
917 1028 self->nt[off].children[k] = noff;
918 1029 off = noff;
919 1030 n = &self->nt[off];
920 1031 n->children[nt_level(oldnode, ++level)] = v;
921 1032 if (level > self->ntdepth)
922 1033 self->ntdepth = level;
923 1034 self->ntsplits += 1;
924 1035 } else {
925 1036 level += 1;
926 1037 off = v;
927 1038 }
928 1039 }
929 1040
930 1041 return -1;
931 1042 }
932 1043
933 1044 static int nt_init(indexObject *self)
934 1045 {
935 1046 if (self->nt == NULL) {
936 1047 if (self->raw_length > INT_MAX) {
937 1048 PyErr_SetString(PyExc_ValueError, "overflow in nt_init");
938 1049 return -1;
939 1050 }
940 1051 self->ntcapacity = self->raw_length < 4
941 1052 ? 4 : (int)self->raw_length / 2;
942 1053
943 1054 self->nt = calloc(self->ntcapacity, sizeof(nodetree));
944 1055 if (self->nt == NULL) {
945 1056 PyErr_NoMemory();
946 1057 return -1;
947 1058 }
948 1059 self->ntlength = 1;
949 1060 self->ntrev = (int)index_length(self) - 1;
950 1061 self->ntlookups = 1;
951 1062 self->ntmisses = 0;
952 1063 if (nt_insert(self, nullid, INT_MAX) == -1)
953 1064 return -1;
954 1065 }
955 1066 return 0;
956 1067 }
957 1068
958 1069 /*
959 1070 * Return values:
960 1071 *
961 1072 * -3: error (exception set)
962 1073 * -2: not found (no exception set)
963 1074 * rest: valid rev
964 1075 */
965 1076 static int index_find_node(indexObject *self,
966 1077 const char *node, Py_ssize_t nodelen)
967 1078 {
968 1079 int rev;
969 1080
970 1081 self->ntlookups++;
971 1082 rev = nt_find(self, node, nodelen, 0);
972 1083 if (rev >= -1)
973 1084 return rev;
974 1085
975 1086 if (nt_init(self) == -1)
976 1087 return -3;
977 1088
978 1089 /*
979 1090 * For the first handful of lookups, we scan the entire index,
980 1091 * and cache only the matching nodes. This optimizes for cases
981 1092 * like "hg tip", where only a few nodes are accessed.
982 1093 *
983 1094 * After that, we cache every node we visit, using a single
984 1095 * scan amortized over multiple lookups. This gives the best
985 1096 * bulk performance, e.g. for "hg log".
986 1097 */
987 1098 if (self->ntmisses++ < 4) {
988 1099 for (rev = self->ntrev - 1; rev >= 0; rev--) {
989 1100 const char *n = index_node(self, rev);
990 1101 if (n == NULL)
991 1102 return -2;
992 1103 if (memcmp(node, n, nodelen > 20 ? 20 : nodelen) == 0) {
993 1104 if (nt_insert(self, n, rev) == -1)
994 1105 return -3;
995 1106 break;
996 1107 }
997 1108 }
998 1109 } else {
999 1110 for (rev = self->ntrev - 1; rev >= 0; rev--) {
1000 1111 const char *n = index_node(self, rev);
1001 1112 if (n == NULL) {
1002 1113 self->ntrev = rev + 1;
1003 1114 return -2;
1004 1115 }
1005 1116 if (nt_insert(self, n, rev) == -1) {
1006 1117 self->ntrev = rev + 1;
1007 1118 return -3;
1008 1119 }
1009 1120 if (memcmp(node, n, nodelen > 20 ? 20 : nodelen) == 0) {
1010 1121 break;
1011 1122 }
1012 1123 }
1013 1124 self->ntrev = rev;
1014 1125 }
1015 1126
1016 1127 if (rev >= 0)
1017 1128 return rev;
1018 1129 return -2;
1019 1130 }
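
/*
 * Illustrative sketch (not part of this change): how a caller in this
 * file can use the return convention above; -3 means an exception is
 * already set, -2 means the node is unknown, anything else is a valid
 * rev (with -1 standing for nullid).
 */
static PyObject *example_rev_for_node(indexObject *self, const char *node)
{
        int rev = index_find_node(self, node, 20);

        if (rev == -3)
                return NULL;            /* exception already set */
        if (rev == -2)
                Py_RETURN_NONE;         /* unknown node */
        return PyInt_FromLong(rev);     /* valid rev, or -1 for nullid */
}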
1020 1131
1021 1132 static PyObject *raise_revlog_error(void)
1022 1133 {
1023 1134 static PyObject *errclass;
1024 1135 PyObject *mod = NULL, *errobj;
1025 1136
1026 1137 if (errclass == NULL) {
1027 1138 PyObject *dict;
1028 1139
1029 1140 mod = PyImport_ImportModule("mercurial.error");
1030 1141 if (mod == NULL)
1031 1142 goto classfail;
1032 1143
1033 1144 dict = PyModule_GetDict(mod);
1034 1145 if (dict == NULL)
1035 1146 goto classfail;
1036 1147
1037 1148 errclass = PyDict_GetItemString(dict, "RevlogError");
1038 1149 if (errclass == NULL) {
1039 1150 PyErr_SetString(PyExc_SystemError,
1040 1151 "could not find RevlogError");
1041 1152 goto classfail;
1042 1153 }
1043 1154 Py_INCREF(errclass);
1044 1155 }
1045 1156
1046 1157 errobj = PyObject_CallFunction(errclass, NULL);
1047 1158 if (errobj == NULL)
1048 1159 return NULL;
1049 1160 PyErr_SetObject(errclass, errobj);
1050 1161 return errobj;
1051 1162
1052 1163 classfail:
1053 1164 Py_XDECREF(mod);
1054 1165 return NULL;
1055 1166 }
1056 1167
1057 1168 static PyObject *index_getitem(indexObject *self, PyObject *value)
1058 1169 {
1059 1170 char *node;
1060 1171 Py_ssize_t nodelen;
1061 1172 int rev;
1062 1173
1063 1174 if (PyInt_Check(value))
1064 1175 return index_get(self, PyInt_AS_LONG(value));
1065 1176
1066 1177 if (node_check(value, &node, &nodelen) == -1)
1067 1178 return NULL;
1068 1179 rev = index_find_node(self, node, nodelen);
1069 1180 if (rev >= -1)
1070 1181 return PyInt_FromLong(rev);
1071 1182 if (rev == -2)
1072 1183 raise_revlog_error();
1073 1184 return NULL;
1074 1185 }
1075 1186
1076 1187 static int nt_partialmatch(indexObject *self, const char *node,
1077 1188 Py_ssize_t nodelen)
1078 1189 {
1079 1190 int rev;
1080 1191
1081 1192 if (nt_init(self) == -1)
1082 1193 return -3;
1083 1194
1084 1195 if (self->ntrev > 0) {
1085 1196 /* ensure that the radix tree is fully populated */
1086 1197 for (rev = self->ntrev - 1; rev >= 0; rev--) {
1087 1198 const char *n = index_node(self, rev);
1088 1199 if (n == NULL)
1089 1200 return -2;
1090 1201 if (nt_insert(self, n, rev) == -1)
1091 1202 return -3;
1092 1203 }
1093 1204 self->ntrev = rev;
1094 1205 }
1095 1206
1096 1207 return nt_find(self, node, nodelen, 1);
1097 1208 }
1098 1209
1099 1210 static PyObject *index_partialmatch(indexObject *self, PyObject *args)
1100 1211 {
1101 1212 const char *fullnode;
1102 1213 int nodelen;
1103 1214 char *node;
1104 1215 int rev, i;
1105 1216
1106 1217 if (!PyArg_ParseTuple(args, "s#", &node, &nodelen))
1107 1218 return NULL;
1108 1219
1109 1220 if (nodelen < 4) {
1110 1221 PyErr_SetString(PyExc_ValueError, "key too short");
1111 1222 return NULL;
1112 1223 }
1113 1224
1114 1225 if (nodelen > 40) {
1115 1226 PyErr_SetString(PyExc_ValueError, "key too long");
1116 1227 return NULL;
1117 1228 }
1118 1229
1119 1230 for (i = 0; i < nodelen; i++)
1120 1231 hexdigit(node, i);
1121 1232 if (PyErr_Occurred()) {
1122 1233 /* input contains non-hex characters */
1123 1234 PyErr_Clear();
1124 1235 Py_RETURN_NONE;
1125 1236 }
1126 1237
1127 1238 rev = nt_partialmatch(self, node, nodelen);
1128 1239
1129 1240 switch (rev) {
1130 1241 case -4:
1131 1242 raise_revlog_error();
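/* fall through: the exception is already set */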
1132 1243 case -3:
1133 1244 return NULL;
1134 1245 case -2:
1135 1246 Py_RETURN_NONE;
1136 1247 case -1:
1137 1248 return PyString_FromStringAndSize(nullid, 20);
1138 1249 }
1139 1250
1140 1251 fullnode = index_node(self, rev);
1141 1252 if (fullnode == NULL) {
1142 1253 PyErr_Format(PyExc_IndexError,
1143 1254 "could not access rev %d", rev);
1144 1255 return NULL;
1145 1256 }
1146 1257 return PyString_FromStringAndSize(fullnode, 20);
1147 1258 }
1148 1259
1149 1260 static PyObject *index_m_get(indexObject *self, PyObject *args)
1150 1261 {
1151 1262 Py_ssize_t nodelen;
1152 1263 PyObject *val;
1153 1264 char *node;
1154 1265 int rev;
1155 1266
1156 1267 if (!PyArg_ParseTuple(args, "O", &val))
1157 1268 return NULL;
1158 1269 if (node_check(val, &node, &nodelen) == -1)
1159 1270 return NULL;
1160 1271 rev = index_find_node(self, node, nodelen);
1161 1272 if (rev == -3)
1162 1273 return NULL;
1163 1274 if (rev == -2)
1164 1275 Py_RETURN_NONE;
1165 1276 return PyInt_FromLong(rev);
1166 1277 }
1167 1278
1168 1279 static int index_contains(indexObject *self, PyObject *value)
1169 1280 {
1170 1281 char *node;
1171 1282 Py_ssize_t nodelen;
1172 1283
1173 1284 if (PyInt_Check(value)) {
1174 1285 long rev = PyInt_AS_LONG(value);
1175 1286 return rev >= -1 && rev < index_length(self);
1176 1287 }
1177 1288
1178 1289 if (node_check(value, &node, &nodelen) == -1)
1179 1290 return -1;
1180 1291
1181 1292 switch (index_find_node(self, node, nodelen)) {
1182 1293 case -3:
1183 1294 return -1;
1184 1295 case -2:
1185 1296 return 0;
1186 1297 default:
1187 1298 return 1;
1188 1299 }
1189 1300 }
1190 1301
1191 1302 static inline void index_get_parents(indexObject *self, int rev, int *ps)
1192 1303 {
1193 1304 if (rev >= self->length - 1) {
1194 1305 PyObject *tuple = PyList_GET_ITEM(self->added,
1195 1306 rev - self->length + 1);
1196 1307 ps[0] = (int)PyInt_AS_LONG(PyTuple_GET_ITEM(tuple, 5));
1197 1308 ps[1] = (int)PyInt_AS_LONG(PyTuple_GET_ITEM(tuple, 6));
1198 1309 } else {
1199 1310 const char *data = index_deref(self, rev);
1200 1311 ps[0] = getbe32(data + 24);
1201 1312 ps[1] = getbe32(data + 28);
1202 1313 }
1203 1314 }
1204 1315
1205 1316 typedef uint64_t bitmask;
1206 1317
1207 1318 /*
1208 1319 * Given a disjoint set of revs, return all candidates for the
1209 1320 * greatest common ancestor. In revset notation, this is the set
1210 1321 * "heads(::a and ::b and ...)"
1211 1322 */
1212 1323 static PyObject *find_gca_candidates(indexObject *self, const int *revs,
1213 1324 int revcount)
1214 1325 {
1215 1326 const bitmask allseen = (1ull << revcount) - 1;
1216 1327 const bitmask poison = 1ull << revcount;
1217 1328 PyObject *gca = PyList_New(0);
1218 1329 int i, v, interesting;
1219 1330 int maxrev = -1;
1220 1331 long sp;
1221 1332 bitmask *seen;
1222 1333
1223 1334 if (gca == NULL)
1224 1335 return PyErr_NoMemory();
1225 1336
1226 1337 for (i = 0; i < revcount; i++) {
1227 1338 if (revs[i] > maxrev)
1228 1339 maxrev = revs[i];
1229 1340 }
1230 1341
1231 1342 seen = calloc(sizeof(*seen), maxrev + 1);
1232 1343 if (seen == NULL) {
1233 1344 Py_DECREF(gca);
1234 1345 return PyErr_NoMemory();
1235 1346 }
1236 1347
1237 1348 for (i = 0; i < revcount; i++)
1238 1349 seen[revs[i]] = 1ull << i;
1239 1350
1240 1351 interesting = revcount;
1241 1352
1242 1353 for (v = maxrev; v >= 0 && interesting; v--) {
1243 1354 long sv = seen[v];
1244 1355 int parents[2];
1245 1356
1246 1357 if (!sv)
1247 1358 continue;
1248 1359
1249 1360 if (sv < poison) {
1250 1361 interesting -= 1;
1251 1362 if (sv == allseen) {
1252 1363 PyObject *obj = PyInt_FromLong(v);
1253 1364 if (obj == NULL)
1254 1365 goto bail;
1255 1366 if (PyList_Append(gca, obj) == -1) {
1256 1367 Py_DECREF(obj);
1257 1368 goto bail;
1258 1369 }
1259 1370 sv |= poison;
1260 1371 for (i = 0; i < revcount; i++) {
1261 1372 if (revs[i] == v)
1262 1373 goto done;
1263 1374 }
1264 1375 }
1265 1376 }
1266 1377 index_get_parents(self, v, parents);
1267 1378
1268 1379 for (i = 0; i < 2; i++) {
1269 1380 int p = parents[i];
1270 1381 if (p == -1)
1271 1382 continue;
1272 1383 sp = seen[p];
1273 1384 if (sv < poison) {
1274 1385 if (sp == 0) {
1275 1386 seen[p] = sv;
1276 1387 interesting++;
1277 1388 }
1278 1389 else if (sp != sv)
1279 1390 seen[p] |= sv;
1280 1391 } else {
1281 1392 if (sp && sp < poison)
1282 1393 interesting--;
1283 1394 seen[p] = sv;
1284 1395 }
1285 1396 }
1286 1397 }
1287 1398
1288 1399 done:
1289 1400 free(seen);
1290 1401 return gca;
1291 1402 bail:
1292 1403 free(seen);
1293 1404 Py_XDECREF(gca);
1294 1405 return NULL;
1295 1406 }
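
/*
 * Illustrative sketch (not in the original patch): a caller passes a
 * small array of valid revs, exactly as index_ancestors() does below
 * after validating its arguments; the returned candidate list still has
 * to be narrowed to the deepest entries by find_deepest().
 */
static PyObject *example_gca_of_two(indexObject *self, int a, int b)
{
        int revs[2];

        revs[0] = a;
        revs[1] = b;
        return find_gca_candidates(self, revs, 2);
}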
1296 1407
1297 1408 /*
1298 1409 * Given a disjoint set of revs, return the subset with the longest
1299 1410 * path to the root.
1300 1411 */
1301 1412 static PyObject *find_deepest(indexObject *self, PyObject *revs)
1302 1413 {
1303 1414 const Py_ssize_t revcount = PyList_GET_SIZE(revs);
1304 1415 static const Py_ssize_t capacity = 24;
1305 1416 int *depth, *interesting = NULL;
1306 1417 int i, j, v, ninteresting;
1307 1418 PyObject *dict = NULL, *keys = NULL;
1308 1419 long *seen = NULL;
1309 1420 int maxrev = -1;
1310 1421 long final;
1311 1422
1312 1423 if (revcount > capacity) {
1313 1424 PyErr_Format(PyExc_OverflowError,
1314 1425 "bitset size (%ld) > capacity (%ld)",
1315 1426 (long)revcount, (long)capacity);
1316 1427 return NULL;
1317 1428 }
1318 1429
1319 1430 for (i = 0; i < revcount; i++) {
1320 1431 int n = (int)PyInt_AsLong(PyList_GET_ITEM(revs, i));
1321 1432 if (n > maxrev)
1322 1433 maxrev = n;
1323 1434 }
1324 1435
1325 1436 depth = calloc(sizeof(*depth), maxrev + 1);
1326 1437 if (depth == NULL)
1327 1438 return PyErr_NoMemory();
1328 1439
1329 1440 seen = calloc(sizeof(*seen), maxrev + 1);
1330 1441 if (seen == NULL) {
1331 1442 PyErr_NoMemory();
1332 1443 goto bail;
1333 1444 }
1334 1445
1335 1446 interesting = calloc(sizeof(*interesting), 2 << revcount);
1336 1447 if (interesting == NULL) {
1337 1448 PyErr_NoMemory();
1338 1449 goto bail;
1339 1450 }
1340 1451
1341 1452 if (PyList_Sort(revs) == -1)
1342 1453 goto bail;
1343 1454
1344 1455 for (i = 0; i < revcount; i++) {
1345 1456 int n = (int)PyInt_AsLong(PyList_GET_ITEM(revs, i));
1346 1457 long b = 1l << i;
1347 1458 depth[n] = 1;
1348 1459 seen[n] = b;
1349 1460 interesting[b] = 1;
1350 1461 }
1351 1462
1352 1463 ninteresting = (int)revcount;
1353 1464
1354 1465 for (v = maxrev; v >= 0 && ninteresting > 1; v--) {
1355 1466 int dv = depth[v];
1356 1467 int parents[2];
1357 1468 long sv;
1358 1469
1359 1470 if (dv == 0)
1360 1471 continue;
1361 1472
1362 1473 sv = seen[v];
1363 1474 index_get_parents(self, v, parents);
1364 1475
1365 1476 for (i = 0; i < 2; i++) {
1366 1477 int p = parents[i];
1367 1478 long nsp, sp;
1368 1479 int dp;
1369 1480
1370 1481 if (p == -1)
1371 1482 continue;
1372 1483
1373 1484 dp = depth[p];
1374 1485 nsp = sp = seen[p];
1375 1486 if (dp <= dv) {
1376 1487 depth[p] = dv + 1;
1377 1488 if (sp != sv) {
1378 1489 interesting[sv] += 1;
1379 1490 nsp = seen[p] = sv;
1380 1491 if (sp) {
1381 1492 interesting[sp] -= 1;
1382 1493 if (interesting[sp] == 0)
1383 1494 ninteresting -= 1;
1384 1495 }
1385 1496 }
1386 1497 }
1387 1498 else if (dv == dp - 1) {
1388 1499 nsp = sp | sv;
1389 1500 if (nsp == sp)
1390 1501 continue;
1391 1502 seen[p] = nsp;
1392 1503 interesting[sp] -= 1;
1393 1504 if (interesting[sp] == 0 && interesting[nsp] > 0)
1394 1505 ninteresting -= 1;
1395 1506 interesting[nsp] += 1;
1396 1507 }
1397 1508 }
1398 1509 interesting[sv] -= 1;
1399 1510 if (interesting[sv] == 0)
1400 1511 ninteresting -= 1;
1401 1512 }
1402 1513
1403 1514 final = 0;
1404 1515 j = ninteresting;
1405 1516 for (i = 0; i < (int)(2 << revcount) && j > 0; i++) {
1406 1517 if (interesting[i] == 0)
1407 1518 continue;
1408 1519 final |= i;
1409 1520 j -= 1;
1410 1521 }
1411 1522 if (final == 0) {
1412 1523 keys = PyList_New(0);
1413 1524 goto bail;
1414 1525 }
1415 1526
1416 1527 dict = PyDict_New();
1417 1528 if (dict == NULL)
1418 1529 goto bail;
1419 1530
1420 1531 for (i = 0; i < revcount; i++) {
1421 1532 PyObject *key;
1422 1533
1423 1534 if ((final & (1 << i)) == 0)
1424 1535 continue;
1425 1536
1426 1537 key = PyList_GET_ITEM(revs, i);
1427 1538 Py_INCREF(key);
1428 1539 Py_INCREF(Py_None);
1429 1540 if (PyDict_SetItem(dict, key, Py_None) == -1) {
1430 1541 Py_DECREF(key);
1431 1542 Py_DECREF(Py_None);
1432 1543 goto bail;
1433 1544 }
1434 1545 }
1435 1546
1436 1547 keys = PyDict_Keys(dict);
1437 1548
1438 1549 bail:
1439 1550 free(depth);
1440 1551 free(seen);
1441 1552 free(interesting);
1442 1553 Py_XDECREF(dict);
1443 1554
1444 1555 return keys;
1445 1556 }
1446 1557
1447 1558 /*
1448 1559 * Given a (possibly overlapping) set of revs, return the greatest
1449 1560 * common ancestors: those with the longest path to the root.
1450 1561 */
1451 1562 static PyObject *index_ancestors(indexObject *self, PyObject *args)
1452 1563 {
1453 1564 PyObject *ret = NULL, *gca = NULL;
1454 1565 Py_ssize_t argcount, i, len;
1455 1566 bitmask repeat = 0;
1456 1567 int revcount = 0;
1457 1568 int *revs;
1458 1569
1459 1570 argcount = PySequence_Length(args);
1460 1571 revs = malloc(argcount * sizeof(*revs));
1461 1572 if (argcount > 0 && revs == NULL)
1462 1573 return PyErr_NoMemory();
1463 1574 len = index_length(self) - 1;
1464 1575
1465 1576 for (i = 0; i < argcount; i++) {
1466 1577 static const int capacity = 24;
1467 1578 PyObject *obj = PySequence_GetItem(args, i);
1468 1579 bitmask x;
1469 1580 long val;
1470 1581
1471 1582 if (!PyInt_Check(obj)) {
1472 1583 PyErr_SetString(PyExc_TypeError,
1473 1584 "arguments must all be ints");
1474 1585 goto bail;
1475 1586 }
1476 1587 val = PyInt_AsLong(obj);
1477 1588 if (val == -1) {
1478 1589 ret = PyList_New(0);
1479 1590 goto done;
1480 1591 }
1481 1592 if (val < 0 || val >= len) {
1482 1593 PyErr_SetString(PyExc_IndexError,
1483 1594 "index out of range");
1484 1595 goto bail;
1485 1596 }
1486 1597 /* this cheesy bloom filter lets us avoid some more
1487 1598 * expensive duplicate checks in the common set-is-disjoint
1488 1599 * case */
1489 1600 x = 1ull << (val & 0x3f);
1490 1601 if (repeat & x) {
1491 1602 int k;
1492 1603 for (k = 0; k < revcount; k++) {
1493 1604 if (val == revs[k])
1494 1605 goto duplicate;
1495 1606 }
1496 1607 }
1497 1608 else repeat |= x;
1498 1609 if (revcount >= capacity) {
1499 1610 PyErr_Format(PyExc_OverflowError,
1500 1611 "bitset size (%d) > capacity (%d)",
1501 1612 revcount, capacity);
1502 1613 goto bail;
1503 1614 }
1504 1615 revs[revcount++] = (int)val;
1505 1616 duplicate:;
1506 1617 }
1507 1618
1508 1619 if (revcount == 0) {
1509 1620 ret = PyList_New(0);
1510 1621 goto done;
1511 1622 }
1512 1623 if (revcount == 1) {
1513 1624 PyObject *obj;
1514 1625 ret = PyList_New(1);
1515 1626 if (ret == NULL)
1516 1627 goto bail;
1517 1628 obj = PyInt_FromLong(revs[0]);
1518 1629 if (obj == NULL)
1519 1630 goto bail;
1520 1631 PyList_SET_ITEM(ret, 0, obj);
1521 1632 goto done;
1522 1633 }
1523 1634
1524 1635 gca = find_gca_candidates(self, revs, revcount);
1525 1636 if (gca == NULL)
1526 1637 goto bail;
1527 1638
1528 1639 if (PyList_GET_SIZE(gca) <= 1) {
1529 1640 ret = gca;
1530 1641 Py_INCREF(gca);
1531 1642 }
1532 1643 else ret = find_deepest(self, gca);
1533 1644
1534 1645 done:
1535 1646 free(revs);
1536 1647 Py_XDECREF(gca);
1537 1648
1538 1649 return ret;
1539 1650
1540 1651 bail:
1541 1652 free(revs);
1542 1653 Py_XDECREF(gca);
1543 1654 Py_XDECREF(ret);
1544 1655 return NULL;
1545 1656 }
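
/*
 * Illustrative sketch (not part of this change): the "cheesy bloom
 * filter" above keys on the low six bits of each rev, so distinct revs
 * can collide; a hit in `repeat` therefore only triggers the exact
 * duplicate scan, it never discards a rev on its own.
 */
static int example_may_be_duplicate(bitmask repeat, long val)
{
        return (repeat & (1ull << (val & 0x3f))) != 0;
}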
1546 1657
1547 1658 /*
1548 1659 * Given a (possibly overlapping) set of revs, return all the
1549 1660 * common ancestor heads: heads(::args[0] and ::args[1] and ...)
1550 1661 */
1551 1662 static PyObject *index_commonancestorsheads(indexObject *self, PyObject *args)
1552 1663 {
1553 1664 PyObject *ret = NULL;
1554 1665 Py_ssize_t argcount, i, len;
1555 1666 bitmask repeat = 0;
1556 1667 int revcount = 0;
1557 1668 int *revs;
1558 1669
1559 1670 argcount = PySequence_Length(args);
1560 1671 revs = malloc(argcount * sizeof(*revs));
1561 1672 if (argcount > 0 && revs == NULL)
1562 1673 return PyErr_NoMemory();
1563 1674 len = index_length(self) - 1;
1564 1675
1565 1676 for (i = 0; i < argcount; i++) {
1566 1677 static const int capacity = 24;
1567 1678 PyObject *obj = PySequence_GetItem(args, i);
1568 1679 bitmask x;
1569 1680 long val;
1570 1681
1571 1682 if (!PyInt_Check(obj)) {
1572 1683 PyErr_SetString(PyExc_TypeError,
1573 1684 "arguments must all be ints");
1574 1685 goto bail;
1575 1686 }
1576 1687 val = PyInt_AsLong(obj);
1577 1688 if (val == -1) {
1578 1689 ret = PyList_New(0);
1579 1690 goto done;
1580 1691 }
1581 1692 if (val < 0 || val >= len) {
1582 1693 PyErr_SetString(PyExc_IndexError,
1583 1694 "index out of range");
1584 1695 goto bail;
1585 1696 }
1586 1697 /* this cheesy bloom filter lets us avoid some more
1587 1698 * expensive duplicate checks in the common set-is-disjoint
1588 1699 * case */
1589 1700 x = 1ull << (val & 0x3f);
1590 1701 if (repeat & x) {
1591 1702 int k;
1592 1703 for (k = 0; k < revcount; k++) {
1593 1704 if (val == revs[k])
1594 1705 goto duplicate;
1595 1706 }
1596 1707 }
1597 1708 else repeat |= x;
1598 1709 if (revcount >= capacity) {
1599 1710 PyErr_Format(PyExc_OverflowError,
1600 1711 "bitset size (%d) > capacity (%d)",
1601 1712 revcount, capacity);
1602 1713 goto bail;
1603 1714 }
1604 1715 revs[revcount++] = (int)val;
1605 1716 duplicate:;
1606 1717 }
1607 1718
1608 1719 if (revcount == 0) {
1609 1720 ret = PyList_New(0);
1610 1721 goto done;
1611 1722 }
1612 1723 if (revcount == 1) {
1613 1724 PyObject *obj;
1614 1725 ret = PyList_New(1);
1615 1726 if (ret == NULL)
1616 1727 goto bail;
1617 1728 obj = PyInt_FromLong(revs[0]);
1618 1729 if (obj == NULL)
1619 1730 goto bail;
1620 1731 PyList_SET_ITEM(ret, 0, obj);
1621 1732 goto done;
1622 1733 }
1623 1734
1624 1735 ret = find_gca_candidates(self, revs, revcount);
1625 1736 if (ret == NULL)
1626 1737 goto bail;
1627 1738
1628 1739 done:
1629 1740 free(revs);
1630 1741 return ret;
1631 1742
1632 1743 bail:
1633 1744 free(revs);
1634 1745 Py_XDECREF(ret);
1635 1746 return NULL;
1636 1747 }
1637 1748
1638 1749 /*
1639 1750 * Invalidate any trie entries introduced by added revs.
1640 1751 */
1641 1752 static void nt_invalidate_added(indexObject *self, Py_ssize_t start)
1642 1753 {
1643 1754 Py_ssize_t i, len = PyList_GET_SIZE(self->added);
1644 1755
1645 1756 for (i = start; i < len; i++) {
1646 1757 PyObject *tuple = PyList_GET_ITEM(self->added, i);
1647 1758 PyObject *node = PyTuple_GET_ITEM(tuple, 7);
1648 1759
1649 1760 nt_insert(self, PyString_AS_STRING(node), -1);
1650 1761 }
1651 1762
1652 1763 if (start == 0)
1653 1764 Py_CLEAR(self->added);
1654 1765 }
1655 1766
1656 1767 /*
1657 1768 * Delete a numeric range of revs; the range must lie at the end of the
1658 1769 * index and must not include the sentinel nullid entry.
1659 1770 */
1660 1771 static int index_slice_del(indexObject *self, PyObject *item)
1661 1772 {
1662 1773 Py_ssize_t start, stop, step, slicelength;
1663 1774 Py_ssize_t length = index_length(self);
1664 1775 int ret = 0;
1665 1776
1666 1777 if (PySlice_GetIndicesEx((PySliceObject*)item, length,
1667 1778 &start, &stop, &step, &slicelength) < 0)
1668 1779 return -1;
1669 1780
1670 1781 if (slicelength <= 0)
1671 1782 return 0;
1672 1783
1673 1784 if ((step < 0 && start < stop) || (step > 0 && start > stop))
1674 1785 stop = start;
1675 1786
1676 1787 if (step < 0) {
1677 1788 stop = start + 1;
1678 1789 start = stop + step*(slicelength - 1) - 1;
1679 1790 step = -step;
1680 1791 }
1681 1792
1682 1793 if (step != 1) {
1683 1794 PyErr_SetString(PyExc_ValueError,
1684 1795 "revlog index delete requires step size of 1");
1685 1796 return -1;
1686 1797 }
1687 1798
1688 1799 if (stop != length - 1) {
1689 1800 PyErr_SetString(PyExc_IndexError,
1690 1801 "revlog index deletion indices are invalid");
1691 1802 return -1;
1692 1803 }
1693 1804
1694 1805 if (start < self->length - 1) {
1695 1806 if (self->nt) {
1696 1807 Py_ssize_t i;
1697 1808
1698 1809 for (i = start + 1; i < self->length - 1; i++) {
1699 1810 const char *node = index_node(self, i);
1700 1811
1701 1812 if (node)
1702 1813 nt_insert(self, node, -1);
1703 1814 }
1704 1815 if (self->added)
1705 1816 nt_invalidate_added(self, 0);
1706 1817 if (self->ntrev > start)
1707 1818 self->ntrev = (int)start;
1708 1819 }
1709 1820 self->length = start + 1;
1710 1821 if (start < self->raw_length) {
1711 1822 if (self->cache) {
1712 1823 Py_ssize_t i;
1713 1824 for (i = start; i < self->raw_length; i++)
1714 1825 Py_CLEAR(self->cache[i]);
1715 1826 }
1716 1827 self->raw_length = start;
1717 1828 }
1718 1829 goto done;
1719 1830 }
1720 1831
1721 1832 if (self->nt) {
1722 1833 nt_invalidate_added(self, start - self->length + 1);
1723 1834 if (self->ntrev > start)
1724 1835 self->ntrev = (int)start;
1725 1836 }
1726 1837 if (self->added)
1727 1838 ret = PyList_SetSlice(self->added, start - self->length + 1,
1728 1839 PyList_GET_SIZE(self->added), NULL);
1729 1840 done:
1730 1841 Py_CLEAR(self->headrevs);
1731 1842 return ret;
1732 1843 }
1733 1844
1734 1845 /*
1735 1846 * Supported ops:
1736 1847 *
1737 1848 * slice deletion
1738 1849 * string assignment (extend node->rev mapping)
1739 1850 * string deletion (shrink node->rev mapping)
1740 1851 */
1741 1852 static int index_assign_subscript(indexObject *self, PyObject *item,
1742 1853 PyObject *value)
1743 1854 {
1744 1855 char *node;
1745 1856 Py_ssize_t nodelen;
1746 1857 long rev;
1747 1858
1748 1859 if (PySlice_Check(item) && value == NULL)
1749 1860 return index_slice_del(self, item);
1750 1861
1751 1862 if (node_check(item, &node, &nodelen) == -1)
1752 1863 return -1;
1753 1864
1754 1865 if (value == NULL)
1755 1866 return self->nt ? nt_insert(self, node, -1) : 0;
1756 1867 rev = PyInt_AsLong(value);
1757 1868 if (rev > INT_MAX || rev < 0) {
1758 1869 if (!PyErr_Occurred())
1759 1870 PyErr_SetString(PyExc_ValueError, "rev out of range");
1760 1871 return -1;
1761 1872 }
1762 1873 return nt_insert(self, node, (int)rev);
1763 1874 }
1764 1875
1765 1876 /*
1766 1877 * Find all RevlogNG entries in an index that has inline data. Update
1767 1878 * the optional "offsets" table with those entries.
1768 1879 */
1769 1880 static long inline_scan(indexObject *self, const char **offsets)
1770 1881 {
1771 1882 const char *data = PyString_AS_STRING(self->data);
1772 1883 Py_ssize_t pos = 0;
1773 1884 Py_ssize_t end = PyString_GET_SIZE(self->data);
1774 1885 long incr = v1_hdrsize;
1775 1886 Py_ssize_t len = 0;
1776 1887
1777 1888 while (pos + v1_hdrsize <= end && pos >= 0) {
1778 1889 uint32_t comp_len;
1779 1890 /* 3rd element of header is length of compressed inline data */
1780 1891 comp_len = getbe32(data + pos + 8);
1781 1892 incr = v1_hdrsize + comp_len;
1782 1893 if (offsets)
1783 1894 offsets[len] = data + pos;
1784 1895 len++;
1785 1896 pos += incr;
1786 1897 }
1787 1898
1788 1899 if (pos != end) {
1789 1900 if (!PyErr_Occurred())
1790 1901 PyErr_SetString(PyExc_ValueError, "corrupt index file");
1791 1902 return -1;
1792 1903 }
1793 1904
1794 1905 return len;
1795 1906 }
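
/*
 * Illustrative sketch (not in the original patch): with inline data the
 * next record header follows the current header plus its compressed
 * chunk, which is exactly the stride inline_scan() records in the
 * offsets table consumed by index_deref().
 */
static const char *example_next_inline_record(const char *rec)
{
        uint32_t comp_len = getbe32(rec + 8);

        return rec + v1_hdrsize + comp_len;
}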
1796 1907
1797 1908 static int index_init(indexObject *self, PyObject *args)
1798 1909 {
1799 1910 PyObject *data_obj, *inlined_obj;
1800 1911 Py_ssize_t size;
1801 1912
1802 1913 /* Initialize before argument-checking to avoid index_dealloc() crash. */
1803 1914 self->raw_length = 0;
1804 1915 self->added = NULL;
1805 1916 self->cache = NULL;
1806 1917 self->data = NULL;
1807 1918 self->headrevs = NULL;
1808 1919 self->nt = NULL;
1809 1920 self->offsets = NULL;
1810 1921
1811 1922 if (!PyArg_ParseTuple(args, "OO", &data_obj, &inlined_obj))
1812 1923 return -1;
1813 1924 if (!PyString_Check(data_obj)) {
1814 1925 PyErr_SetString(PyExc_TypeError, "data is not a string");
1815 1926 return -1;
1816 1927 }
1817 1928 size = PyString_GET_SIZE(data_obj);
1818 1929
1819 1930 self->inlined = inlined_obj && PyObject_IsTrue(inlined_obj);
1820 1931 self->data = data_obj;
1821 1932
1822 1933 self->ntlength = self->ntcapacity = 0;
1823 1934 self->ntdepth = self->ntsplits = 0;
1824 1935 self->ntlookups = self->ntmisses = 0;
1825 1936 self->ntrev = -1;
1826 1937 Py_INCREF(self->data);
1827 1938
1828 1939 if (self->inlined) {
1829 1940 long len = inline_scan(self, NULL);
1830 1941 if (len == -1)
1831 1942 goto bail;
1832 1943 self->raw_length = len;
1833 1944 self->length = len + 1;
1834 1945 } else {
1835 1946 if (size % v1_hdrsize) {
1836 1947 PyErr_SetString(PyExc_ValueError, "corrupt index file");
1837 1948 goto bail;
1838 1949 }
1839 1950 self->raw_length = size / v1_hdrsize;
1840 1951 self->length = self->raw_length + 1;
1841 1952 }
1842 1953
1843 1954 return 0;
1844 1955 bail:
1845 1956 return -1;
1846 1957 }
1847 1958
1848 1959 static PyObject *index_nodemap(indexObject *self)
1849 1960 {
1850 1961 Py_INCREF(self);
1851 1962 return (PyObject *)self;
1852 1963 }
1853 1964
1854 1965 static void index_dealloc(indexObject *self)
1855 1966 {
1856 1967 _index_clearcaches(self);
1857 1968 Py_XDECREF(self->data);
1858 1969 Py_XDECREF(self->added);
1859 1970 PyObject_Del(self);
1860 1971 }
1861 1972
1862 1973 static PySequenceMethods index_sequence_methods = {
1863 1974 (lenfunc)index_length, /* sq_length */
1864 1975 0, /* sq_concat */
1865 1976 0, /* sq_repeat */
1866 1977 (ssizeargfunc)index_get, /* sq_item */
1867 1978 0, /* sq_slice */
1868 1979 0, /* sq_ass_item */
1869 1980 0, /* sq_ass_slice */
1870 1981 (objobjproc)index_contains, /* sq_contains */
1871 1982 };
1872 1983
1873 1984 static PyMappingMethods index_mapping_methods = {
1874 1985 (lenfunc)index_length, /* mp_length */
1875 1986 (binaryfunc)index_getitem, /* mp_subscript */
1876 1987 (objobjargproc)index_assign_subscript, /* mp_ass_subscript */
1877 1988 };
1878 1989
1879 1990 static PyMethodDef index_methods[] = {
1880 1991 {"ancestors", (PyCFunction)index_ancestors, METH_VARARGS,
1881 1992 "return the gca set of the given revs"},
1882 1993 {"commonancestorsheads", (PyCFunction)index_commonancestorsheads,
1883 1994 METH_VARARGS,
1884 1995 "return the heads of the common ancestors of the given revs"},
1885 1996 {"clearcaches", (PyCFunction)index_clearcaches, METH_NOARGS,
1886 1997 "clear the index caches"},
1887 1998 {"get", (PyCFunction)index_m_get, METH_VARARGS,
1888 1999 "get an index entry"},
1889 2000 {"headrevs", (PyCFunction)index_headrevs, METH_NOARGS,
1890 2001 "get head revisions"},
1891 2002 {"insert", (PyCFunction)index_insert, METH_VARARGS,
1892 2003 "insert an index entry"},
1893 2004 {"partialmatch", (PyCFunction)index_partialmatch, METH_VARARGS,
1894 2005 "match a potentially ambiguous node ID"},
1895 2006 {"stats", (PyCFunction)index_stats, METH_NOARGS,
1896 2007 "stats for the index"},
1897 2008 {NULL} /* Sentinel */
1898 2009 };
1899 2010
1900 2011 static PyGetSetDef index_getset[] = {
1901 2012 {"nodemap", (getter)index_nodemap, NULL, "nodemap", NULL},
1902 2013 {NULL} /* Sentinel */
1903 2014 };
1904 2015
1905 2016 static PyTypeObject indexType = {
1906 2017 PyObject_HEAD_INIT(NULL)
1907 2018 0, /* ob_size */
1908 2019 "parsers.index", /* tp_name */
1909 2020 sizeof(indexObject), /* tp_basicsize */
1910 2021 0, /* tp_itemsize */
1911 2022 (destructor)index_dealloc, /* tp_dealloc */
1912 2023 0, /* tp_print */
1913 2024 0, /* tp_getattr */
1914 2025 0, /* tp_setattr */
1915 2026 0, /* tp_compare */
1916 2027 0, /* tp_repr */
1917 2028 0, /* tp_as_number */
1918 2029 &index_sequence_methods, /* tp_as_sequence */
1919 2030 &index_mapping_methods, /* tp_as_mapping */
1920 2031 0, /* tp_hash */
1921 2032 0, /* tp_call */
1922 2033 0, /* tp_str */
1923 2034 0, /* tp_getattro */
1924 2035 0, /* tp_setattro */
1925 2036 0, /* tp_as_buffer */
1926 2037 Py_TPFLAGS_DEFAULT, /* tp_flags */
1927 2038 "revlog index", /* tp_doc */
1928 2039 0, /* tp_traverse */
1929 2040 0, /* tp_clear */
1930 2041 0, /* tp_richcompare */
1931 2042 0, /* tp_weaklistoffset */
1932 2043 0, /* tp_iter */
1933 2044 0, /* tp_iternext */
1934 2045 index_methods, /* tp_methods */
1935 2046 0, /* tp_members */
1936 2047 index_getset, /* tp_getset */
1937 2048 0, /* tp_base */
1938 2049 0, /* tp_dict */
1939 2050 0, /* tp_descr_get */
1940 2051 0, /* tp_descr_set */
1941 2052 0, /* tp_dictoffset */
1942 2053 (initproc)index_init, /* tp_init */
1943 2054 0, /* tp_alloc */
1944 2055 };
1945 2056
1946 2057 /*
1947 2058 * returns a tuple of the form (index, cache) with elements as
1948 2059 * follows:
1949 2060 *
1950 2061 * index: an index object that lazily parses RevlogNG records
1951 2062 * cache: if data is inlined, a tuple (0, index_file_content), else None
1952 2063 *
1953 2064 * added complications are for backwards compatibility
1954 2065 */
1955 2066 static PyObject *parse_index2(PyObject *self, PyObject *args)
1956 2067 {
1957 2068 PyObject *tuple = NULL, *cache = NULL;
1958 2069 indexObject *idx;
1959 2070 int ret;
1960 2071
1961 2072 idx = PyObject_New(indexObject, &indexType);
1962 2073 if (idx == NULL)
1963 2074 goto bail;
1964 2075
1965 2076 ret = index_init(idx, args);
1966 2077 if (ret == -1)
1967 2078 goto bail;
1968 2079
1969 2080 if (idx->inlined) {
1970 2081 cache = Py_BuildValue("iO", 0, idx->data);
1971 2082 if (cache == NULL)
1972 2083 goto bail;
1973 2084 } else {
1974 2085 cache = Py_None;
1975 2086 Py_INCREF(cache);
1976 2087 }
1977 2088
1978 2089 tuple = Py_BuildValue("NN", idx, cache);
1979 2090 if (!tuple)
1980 2091 goto bail;
1981 2092 return tuple;
1982 2093
1983 2094 bail:
1984 2095 Py_XDECREF(idx);
1985 2096 Py_XDECREF(cache);
1986 2097 Py_XDECREF(tuple);
1987 2098 return NULL;
1988 2099 }
1989 2100
1990 2101 static char parsers_doc[] = "Efficient content parsing.";
1991 2102
1992 2103 PyObject *encodedir(PyObject *self, PyObject *args);
1993 2104 PyObject *pathencode(PyObject *self, PyObject *args);
1994 2105 PyObject *lowerencode(PyObject *self, PyObject *args);
1995 2106
1996 2107 static PyMethodDef methods[] = {
1997 2108 {"pack_dirstate", pack_dirstate, METH_VARARGS, "pack a dirstate\n"},
1998 2109 {"parse_manifest", parse_manifest, METH_VARARGS, "parse a manifest\n"},
1999 2110 {"parse_dirstate", parse_dirstate, METH_VARARGS, "parse a dirstate\n"},
2000 2111 {"parse_index2", parse_index2, METH_VARARGS, "parse a revlog index\n"},
2001 2112 {"encodedir", encodedir, METH_VARARGS, "encodedir a path\n"},
2002 2113 {"pathencode", pathencode, METH_VARARGS, "fncache-encode a path\n"},
2003 2114 {"lowerencode", lowerencode, METH_VARARGS, "lower-encode a path\n"},
2004 2115 {NULL, NULL}
2005 2116 };
2006 2117
2007 2118 void dirs_module_init(PyObject *mod);
2008 2119
2009 2120 static void module_init(PyObject *mod)
2010 2121 {
2011 2122 /* This module constant has two purposes. First, it lets us unit test
2012 2123 * the ImportError raised without hard-coding any error text. This
2013 2124 * means we can change the text in the future without breaking tests,
2014 2125 * even across changesets without a recompile. Second, its presence
2015 2126 * can be used to determine whether the version-checking logic is
2016 2127 * present, which also helps in testing across changesets without a
2017 2128 * recompile. Note that this means the pure-Python version of parsers
2018 2129 * should not have this module constant. */
2019 2130 PyModule_AddStringConstant(mod, "versionerrortext", versionerrortext);
2020 2131
2021 2132 dirs_module_init(mod);
2022 2133
2023 2134 indexType.tp_new = PyType_GenericNew;
2024 if (PyType_Ready(&indexType) < 0)
2135 if (PyType_Ready(&indexType) < 0 ||
2136 PyType_Ready(&dirstateTupleType) < 0)
2025 2137 return;
2026 2138 Py_INCREF(&indexType);
2027
2028 2139 PyModule_AddObject(mod, "index", (PyObject *)&indexType);
2140 Py_INCREF(&dirstateTupleType);
2141 PyModule_AddObject(mod, "dirstatetuple",
2142 (PyObject *)&dirstateTupleType);
2029 2143
2030 2144 nullentry = Py_BuildValue("iiiiiiis#", 0, 0, 0,
2031 2145 -1, -1, -1, -1, nullid, 20);
2032 2146 if (nullentry)
2033 2147 PyObject_GC_UnTrack(nullentry);
2034 2148 }
2035 2149
2036 2150 static int check_python_version(void)
2037 2151 {
2038 2152 PyObject *sys = PyImport_ImportModule("sys");
2039 2153 long hexversion = PyInt_AsLong(PyObject_GetAttrString(sys, "hexversion"));
2040 2154 /* sys.hexversion is a 32-bit number by default, so the -1 case
2041 2155 * should only occur in unusual circumstances (e.g. if sys.hexversion
2042 2156 * is manually set to an invalid value). */
2043 2157 if ((hexversion == -1) || (hexversion >> 16 != PY_VERSION_HEX >> 16)) {
2044 2158 PyErr_Format(PyExc_ImportError, "%s: The Mercurial extension "
2045 2159 "modules were compiled with Python " PY_VERSION ", but "
2046 2160 "Mercurial is currently using Python with sys.hexversion=%ld: "
2047 2161 "Python %s\n at: %s", versionerrortext, hexversion,
2048 2162 Py_GetVersion(), Py_GetProgramFullPath());
2049 2163 return -1;
2050 2164 }
2051 2165 return 0;
2052 2166 }
2053 2167
2054 2168 #ifdef IS_PY3K
2055 2169 static struct PyModuleDef parsers_module = {
2056 2170 PyModuleDef_HEAD_INIT,
2057 2171 "parsers",
2058 2172 parsers_doc,
2059 2173 -1,
2060 2174 methods
2061 2175 };
2062 2176
2063 2177 PyMODINIT_FUNC PyInit_parsers(void)
2064 2178 {
2065 2179 PyObject *mod;
2066 2180
2067 2181 if (check_python_version() == -1)
2068 2182 return;
2069 2183 mod = PyModule_Create(&parsers_module);
2070 2184 module_init(mod);
2071 2185 return mod;
2072 2186 }
2073 2187 #else
2074 2188 PyMODINIT_FUNC initparsers(void)
2075 2189 {
2076 2190 PyObject *mod;
2077 2191
2078 2192 if (check_python_version() == -1)
2079 2193 return;
2080 2194 mod = Py_InitModule3("parsers", methods, parsers_doc);
2081 2195 module_init(mod);
2082 2196 }
2083 2197 #endif
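
A short usage sketch of the module built from this file (assumptions: Python 2,
a non-empty, non-inline revlog index whose raw bytes are already in `data`, an
unambiguous 12-character prefix, and no error handling):

    from mercurial import parsers

    # parse_index2 returns (index, cache); cache is None for non-inline data
    index, cache = parsers.parse_index2(data, False)
    tip = len(index) - 2              # last real rev; the final row is nullid
    node = index[tip][7]              # 20-byte binary node of tip
    assert index.partialmatch(node.encode('hex')[:12]) == node
    heads = index.headrevs()          # revs without children
    gca = index.ancestors(0, tip)     # deepest common ancestors of 0 and tip
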
@@ -1,115 +1,121 b''
1 1 # parsers.py - Python implementation of parsers.c
2 2 #
3 3 # Copyright 2009 Matt Mackall <mpm@selenic.com> and others
4 4 #
5 5 # This software may be used and distributed according to the terms of the
6 6 # GNU General Public License version 2 or any later version.
7 7
8 8 from mercurial.node import bin, nullid
9 9 from mercurial import util
10 10 import struct, zlib, cStringIO
11 11
12 12 _pack = struct.pack
13 13 _unpack = struct.unpack
14 14 _compress = zlib.compress
15 15 _decompress = zlib.decompress
16 16 _sha = util.sha1
17 17
18 # Some code below makes tuples directly because it's more convenient. However,
19 # code outside this module should always use dirstatetuple.
20 def dirstatetuple(*x):
21 # x is a tuple
22 return x
23
18 24 def parse_manifest(mfdict, fdict, lines):
19 25 for l in lines.splitlines():
20 26 f, n = l.split('\0')
21 27 if len(n) > 40:
22 28 fdict[f] = n[40:]
23 29 mfdict[f] = bin(n[:40])
24 30 else:
25 31 mfdict[f] = bin(n)
26 32
27 33 def parse_index2(data, inline):
28 34 def gettype(q):
29 35 return int(q & 0xFFFF)
30 36
31 37 def offset_type(offset, type):
32 38 return long(long(offset) << 16 | type)
33 39
34 40 indexformatng = ">Qiiiiii20s12x"
35 41
36 42 s = struct.calcsize(indexformatng)
37 43 index = []
38 44 cache = None
39 45 off = 0
40 46
41 47 l = len(data) - s
42 48 append = index.append
43 49 if inline:
44 50 cache = (0, data)
45 51 while off <= l:
46 52 e = _unpack(indexformatng, data[off:off + s])
47 53 append(e)
48 54 if e[1] < 0:
49 55 break
50 56 off += e[1] + s
51 57 else:
52 58 while off <= l:
53 59 e = _unpack(indexformatng, data[off:off + s])
54 60 append(e)
55 61 off += s
56 62
57 63 if off != len(data):
58 64 raise ValueError('corrupt index file')
59 65
60 66 if index:
61 67 e = list(index[0])
62 68 type = gettype(e[0])
63 69 e[0] = offset_type(0, type)
64 70 index[0] = tuple(e)
65 71
66 72 # add the magic null revision at -1
67 73 index.append((0, 0, 0, -1, -1, -1, -1, nullid))
68 74
69 75 return index, cache
70 76
71 77 def parse_dirstate(dmap, copymap, st):
72 78 parents = [st[:20], st[20: 40]]
73 79 # dereference fields so they will be local in loop
74 80 format = ">cllll"
75 81 e_size = struct.calcsize(format)
76 82 pos1 = 40
77 83 l = len(st)
78 84
79 85 # the inner loop
80 86 while pos1 < l:
81 87 pos2 = pos1 + e_size
82 88 e = _unpack(">cllll", st[pos1:pos2]) # a literal here is faster
83 89 pos1 = pos2 + e[4]
84 90 f = st[pos2:pos1]
85 91 if '\0' in f:
86 92 f, c = f.split('\0')
87 93 copymap[f] = c
88 94 dmap[f] = e[:4]
89 95 return parents
90 96
91 97 def pack_dirstate(dmap, copymap, pl, now):
92 98 now = int(now)
93 99 cs = cStringIO.StringIO()
94 100 write = cs.write
95 101 write("".join(pl))
96 102 for f, e in dmap.iteritems():
97 103 if e[0] == 'n' and e[3] == now:
98 104 # The file was last modified "simultaneously" with the current
99 105 # write to dirstate (i.e. within the same second for file-
100 106 # systems with a granularity of 1 sec). This commonly happens
101 107 # for at least a couple of files on 'update'.
102 108 # The user could change the file without changing its size
103 109 # within the same second. Invalidate the file's mtime in
104 110 # dirstate, forcing future 'status' calls to compare the
105 111 # contents of the file if the size is the same. This prevents
106 112 # mistakenly treating such files as clean.
107 e = (e[0], e[1], e[2], -1)
113 e = dirstatetuple(e[0], e[1], e[2], -1)
108 114 dmap[f] = e
109 115
110 116 if f in copymap:
111 117 f = "%s\0%s" % (f, copymap[f])
112 118 e = _pack(">cllll", e[0], e[1], e[2], e[3], len(f))
113 119 write(e)
114 120 write(f)
115 121 return cs.getvalue()
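
A small round-trip sketch for the pure-Python dirstate helpers above
(assumptions: it runs inside this module, and the filename and stat values are
invented for the example):

    pl = ['\0' * 20, '\0' * 20]                  # parent nodes (both null)
    dmap, copymap = {}, {}
    dmap['a.txt'] = dirstatetuple('n', 0644, 5, 0)
    raw = pack_dirstate(dmap, copymap, pl, 1)    # now=1, so no mtime is cleared
    dmap2, copymap2 = {}, {}
    assert parse_dirstate(dmap2, copymap2, raw) == pl
    assert dmap2['a.txt'] == ('n', 0644, 5, 0)
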
@@ -1,172 +1,183 b''
1 1 /*
2 2 util.h - utility functions for interfacing with the various python APIs.
3 3
4 4 This software may be used and distributed according to the terms of
5 5 the GNU General Public License, incorporated herein by reference.
6 6 */
7 7
8 8 #ifndef _HG_UTIL_H_
9 9 #define _HG_UTIL_H_
10 10
11 11 #if PY_MAJOR_VERSION >= 3
12 12
13 13 #define IS_PY3K
14 14 #define PyInt_FromLong PyLong_FromLong
15 15 #define PyInt_AsLong PyLong_AsLong
16 16
17 17 /*
18 18 Mapping of some of the python < 2.x PyString* functions to py3k's PyUnicode.
19 19
20 20 The commented names below represent those that are present in the PyBytes
21 21 definitions for python < 2.6 (below in this file) that don't have a direct
22 22 implementation.
23 23 */
24 24
25 25 #define PyStringObject PyUnicodeObject
26 26 #define PyString_Type PyUnicode_Type
27 27
28 28 #define PyString_Check PyUnicode_Check
29 29 #define PyString_CheckExact PyUnicode_CheckExact
30 30 #define PyString_CHECK_INTERNED PyUnicode_CHECK_INTERNED
31 31 #define PyString_AS_STRING PyUnicode_AsLatin1String
32 32 #define PyString_GET_SIZE PyUnicode_GET_SIZE
33 33
34 34 #define PyString_FromStringAndSize PyUnicode_FromStringAndSize
35 35 #define PyString_FromString PyUnicode_FromString
36 36 #define PyString_FromFormatV PyUnicode_FromFormatV
37 37 #define PyString_FromFormat PyUnicode_FromFormat
38 38 /* #define PyString_Size PyUnicode_GET_SIZE */
39 39 /* #define PyString_AsString */
40 40 /* #define PyString_Repr */
41 41 #define PyString_Concat PyUnicode_Concat
42 42 #define PyString_ConcatAndDel PyUnicode_AppendAndDel
43 43 #define _PyString_Resize PyUnicode_Resize
44 44 /* #define _PyString_Eq */
45 45 #define PyString_Format PyUnicode_Format
46 46 /* #define _PyString_FormatLong */
47 47 /* #define PyString_DecodeEscape */
48 48 #define _PyString_Join PyUnicode_Join
49 49 #define PyString_Decode PyUnicode_Decode
50 50 #define PyString_Encode PyUnicode_Encode
51 51 #define PyString_AsEncodedObject PyUnicode_AsEncodedObject
52 52 #define PyString_AsEncodedString PyUnicode_AsEncodedString
53 53 #define PyString_AsDecodedObject PyUnicode_AsDecodedObject
54 54 #define PyString_AsDecodedString PyUnicode_AsDecodedUnicode
55 55 /* #define PyString_AsStringAndSize */
56 56 #define _PyString_InsertThousandsGrouping _PyUnicode_InsertThousandsGrouping
57 57
58 58 #endif /* PY_MAJOR_VERSION */
59 59
60 60 /* Backports from 2.6 */
61 61 #if PY_VERSION_HEX < 0x02060000
62 62
63 63 #define Py_TYPE(ob) (ob)->ob_type
64 64 #define Py_SIZE(ob) (ob)->ob_size
65 65 #define PyVarObject_HEAD_INIT(type, size) PyObject_HEAD_INIT(type) size,
66 66
67 67 /* Shamelessly stolen from bytesobject.h */
68 68 #define PyBytesObject PyStringObject
69 69 #define PyBytes_Type PyString_Type
70 70
71 71 #define PyBytes_Check PyString_Check
72 72 #define PyBytes_CheckExact PyString_CheckExact
73 73 #define PyBytes_CHECK_INTERNED PyString_CHECK_INTERNED
74 74 #define PyBytes_AS_STRING PyString_AS_STRING
75 75 #define PyBytes_GET_SIZE PyString_GET_SIZE
76 76 #define Py_TPFLAGS_BYTES_SUBCLASS Py_TPFLAGS_STRING_SUBCLASS
77 77
78 78 #define PyBytes_FromStringAndSize PyString_FromStringAndSize
79 79 #define PyBytes_FromString PyString_FromString
80 80 #define PyBytes_FromFormatV PyString_FromFormatV
81 81 #define PyBytes_FromFormat PyString_FromFormat
82 82 #define PyBytes_Size PyString_Size
83 83 #define PyBytes_AsString PyString_AsString
84 84 #define PyBytes_Repr PyString_Repr
85 85 #define PyBytes_Concat PyString_Concat
86 86 #define PyBytes_ConcatAndDel PyString_ConcatAndDel
87 87 #define _PyBytes_Resize _PyString_Resize
88 88 #define _PyBytes_Eq _PyString_Eq
89 89 #define PyBytes_Format PyString_Format
90 90 #define _PyBytes_FormatLong _PyString_FormatLong
91 91 #define PyBytes_DecodeEscape PyString_DecodeEscape
92 92 #define _PyBytes_Join _PyString_Join
93 93 #define PyBytes_Decode PyString_Decode
94 94 #define PyBytes_Encode PyString_Encode
95 95 #define PyBytes_AsEncodedObject PyString_AsEncodedObject
96 96 #define PyBytes_AsEncodedString PyString_AsEncodedString
97 97 #define PyBytes_AsDecodedObject PyString_AsDecodedObject
98 98 #define PyBytes_AsDecodedString PyString_AsDecodedString
99 99 #define PyBytes_AsStringAndSize PyString_AsStringAndSize
100 100 #define _PyBytes_InsertThousandsGrouping _PyString_InsertThousandsGrouping
101 101
102 102 #endif /* PY_VERSION_HEX */
103 103
104 104 #if (PY_VERSION_HEX < 0x02050000)
105 105 /* Definitions to get compatibility with python 2.4 and earlier which
106 106 does not have Py_ssize_t. See also PEP 353.
107 107 Note: msvc (8 or earlier) does not have ssize_t, so we use Py_ssize_t.
108 108 */
109 109 typedef int Py_ssize_t;
110 110 typedef Py_ssize_t (*lenfunc)(PyObject *);
111 111 typedef PyObject *(*ssizeargfunc)(PyObject *, Py_ssize_t);
112 112 #define PyInt_FromSsize_t PyInt_FromLong
113 113
114 114 #if !defined(PY_SSIZE_T_MIN)
115 115 #define PY_SSIZE_T_MAX INT_MAX
116 116 #define PY_SSIZE_T_MIN INT_MIN
117 117 #endif
118 118 #endif
119 119
120 120 #ifdef _WIN32
121 121 #ifdef _MSC_VER
122 122 /* msvc 6.0 has problems */
123 123 #define inline __inline
124 124 typedef signed char int8_t;
125 125 typedef short int16_t;
126 126 typedef long int32_t;
127 127 typedef __int64 int64_t;
128 128 typedef unsigned char uint8_t;
129 129 typedef unsigned short uint16_t;
130 130 typedef unsigned long uint32_t;
131 131 typedef unsigned __int64 uint64_t;
132 132 #else
133 133 #include <stdint.h>
134 134 #endif
135 135 #else
136 136 /* not windows */
137 137 #include <sys/types.h>
138 138 #if defined __BEOS__ && !defined __HAIKU__
139 139 #include <ByteOrder.h>
140 140 #else
141 141 #include <arpa/inet.h>
142 142 #endif
143 143 #include <inttypes.h>
144 144 #endif
145 145
146 146 #if defined __hpux || defined __SUNPRO_C || defined _AIX
147 147 #define inline
148 148 #endif
149 149
150 150 #ifdef __linux
151 151 #define inline __inline
152 152 #endif
153 153
154 typedef struct {
155 PyObject_HEAD
156 char state;
157 int mode;
158 int size;
159 int mtime;
160 } dirstateTupleObject;
161
162 PyTypeObject dirstateTupleType;
163 #define dirstate_tuple_check(op) (Py_TYPE(op) == &dirstateTupleType)
164
154 165 static inline uint32_t getbe32(const char *c)
155 166 {
156 167 const unsigned char *d = (const unsigned char *)c;
157 168
158 169 return ((d[0] << 24) |
159 170 (d[1] << 16) |
160 171 (d[2] << 8) |
161 172 (d[3]));
162 173 }
163 174
164 175 static inline void putbe32(uint32_t x, char *c)
165 176 {
166 177 c[0] = (x >> 24) & 0xff;
167 178 c[1] = (x >> 16) & 0xff;
168 179 c[2] = (x >> 8) & 0xff;
169 180 c[3] = (x) & 0xff;
170 181 }
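
/*
 * Illustrative sketch (not part of this change): putbe32()/getbe32()
 * round-trip a 32-bit value through big-endian byte order regardless of
 * the host's endianness.
 */
static inline int example_be32_roundtrip(void)
{
        char buf[4];

        putbe32(0x01020304u, buf);
        return getbe32(buf) == 0x01020304u && buf[0] == 1 && buf[3] == 4;
}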
171 182
172 183 #endif /* _HG_UTIL_H_ */