revlog: fix caching of buffer objects
Matt Mackall
r5450:c728424d default
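This changeset normalizes values to str before caching them: appender.write()
now stores str(s), and revlog.revision() returns str(self._cache[2]) (and uses
str() when reusing the cached text). The cause is further down in addgroup(),
which slices incoming chunks zero-copy with buffer() objects that can end up in
the write buffer and in the revision cache. A minimal Python 2 sketch of the
pitfall, with hypothetical data:

    b = buffer("....chunk payload", 4)   # zero-copy view into a larger string
    str(b)                               # 'chunk payload' -- a real copy
    len(b)                               # 13 -- so the problem hides until...
    "".join(["", b])                     # TypeError: expected string, buffer found

appender.end() and appender.read() join self.data, so a buffer stored there
blows up later; a buffer kept in _cache also pins its whole underlying chunk
in memory. Converting to str fixes both.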
@@ -1,198 +1,198 @@ changelog.py
1 1 # changelog.py - changelog class for mercurial
2 2 #
3 3 # Copyright 2005-2007 Matt Mackall <mpm@selenic.com>
4 4 #
5 5 # This software may be used and distributed according to the terms
6 6 # of the GNU General Public License, incorporated herein by reference.
7 7
8 8 from revlog import *
9 9 from i18n import _
10 10 import os, time, util
11 11
12 12 def _string_escape(text):
13 13 """
14 14 >>> d = {'nl': chr(10), 'bs': chr(92), 'cr': chr(13), 'nul': chr(0)}
15 15 >>> s = "ab%(nl)scd%(bs)s%(bs)sn%(nul)sab%(cr)scd%(bs)s%(nl)s" % d
16 16 >>> s
17 17 'ab\\ncd\\\\\\\\n\\x00ab\\rcd\\\\\\n'
18 18 >>> res = _string_escape(s)
19 19 >>> s == _string_unescape(res)
20 20 True
21 21 """
22 22 # subset of the string_escape codec
23 23 text = text.replace('\\', '\\\\').replace('\n', '\\n').replace('\r', '\\r')
24 24 return text.replace('\0', '\\0')
25 25
26 26 def _string_unescape(text):
27 27 return text.decode('string_escape')
28 28
29 29 class appender:
30 30 '''the changelog index must be updated last on disk, so we use this class
31 31 to delay writes to it'''
32 32 def __init__(self, fp, buf):
33 33 self.data = buf
34 34 self.fp = fp
35 35 self.offset = fp.tell()
36 36 self.size = util.fstat(fp).st_size
37 37
38 38 def end(self):
39 39 return self.size + len("".join(self.data))
40 40 def tell(self):
41 41 return self.offset
42 42 def flush(self):
43 43 pass
44 44 def close(self):
45 45 self.fp.close()
46 46
47 47 def seek(self, offset, whence=0):
48 48 '''virtual file offset spans real file and data'''
49 49 if whence == 0:
50 50 self.offset = offset
51 51 elif whence == 1:
52 52 self.offset += offset
53 53 elif whence == 2:
54 54 self.offset = self.end() + offset
55 55 if self.offset < self.size:
56 56 self.fp.seek(self.offset)
57 57
58 58 def read(self, count=-1):
59 59 '''only trick here is reads that span real file and data'''
60 60 ret = ""
61 61 if self.offset < self.size:
62 62 s = self.fp.read(count)
63 63 ret = s
64 64 self.offset += len(s)
65 65 if count > 0:
66 66 count -= len(s)
67 67 if count != 0:
68 68 doff = self.offset - self.size
69 69 self.data.insert(0, "".join(self.data))
70 70 del self.data[1:]
71 71 s = self.data[0][doff:doff+count]
72 72 self.offset += len(s)
73 73 ret += s
74 74 return ret
75 75
76 76 def write(self, s):
77 self.data.append(s)
77 self.data.append(str(s))
78 78 self.offset += len(s)
79 79
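A minimal sketch (Python 2, hypothetical data, run in this module's context so
util is available) of the virtual file an appender presents:

    import tempfile
    fp = tempfile.NamedTemporaryFile()
    fp.write("ONDISK!")              # 7 bytes really on disk
    fp.flush()
    fp.seek(0, 2)                    # appender records tell() and size here
    a = appender(fp, [])
    a.write("INMEMORY!")             # 9 bytes buffered, not written to disk
    a.seek(0)
    assert a.read(16) == "ONDISK!INMEMORY!"   # a read spanning file and buffer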
80 80 class changelog(revlog):
81 81 def __init__(self, opener):
82 82 revlog.__init__(self, opener, "00changelog.i")
83 83
84 84 def delayupdate(self):
85 85 "delay visibility of index updates to other readers"
86 86 self._realopener = self.opener
87 87 self.opener = self._delayopener
88 88 self._delaycount = self.count()
89 89 self._delaybuf = []
90 90 self._delayname = None
91 91
92 92 def finalize(self, tr):
93 93 "finalize index updates"
94 94 self.opener = self._realopener
95 95 # move redirected index data back into place
96 96 if self._delayname:
97 97 util.rename(self._delayname + ".a", self._delayname)
98 98 elif self._delaybuf:
99 99 fp = self.opener(self.indexfile, 'a')
100 100 fp.write("".join(self._delaybuf))
101 101 fp.close()
102 102 del self._delaybuf
103 103 # split when we're done
104 104 self.checkinlinesize(tr)
105 105
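Sketched with a hypothetical driver, the intended calling sequence is:

    cl.delayupdate()    # divert index writes (to 00changelog.i.a or to memory)
    cl.addgroup(...)    # new revisions arrive; the index stays invisible
    cl.finalize(tr)     # rename the .a file back, or append the buffered data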
106 106 def _delayopener(self, name, mode='r'):
107 107 fp = self._realopener(name, mode)
108 108 # only divert the index
109 109 if not name == self.indexfile:
110 110 return fp
111 111 # if we're doing an initial clone, divert to another file
112 112 if self._delaycount == 0:
113 113 self._delayname = fp.name
114 114 return self._realopener(name + ".a", mode)
115 115 # otherwise, divert to memory
116 116 return appender(fp, self._delaybuf)
117 117
118 118 def checkinlinesize(self, tr, fp=None):
119 119 if self.opener == self._delayopener:
120 120 return
121 121 return revlog.checkinlinesize(self, tr, fp)
122 122
123 123 def decode_extra(self, text):
124 124 extra = {}
125 125 for l in text.split('\0'):
126 126 if not l:
127 127 continue
128 128 k, v = _string_unescape(l).split(':', 1)
129 129 extra[k] = v
130 130 return extra
131 131
132 132 def encode_extra(self, d):
133 133 # keys must be sorted to produce a deterministic changelog entry
134 134 keys = d.keys()
135 135 keys.sort()
136 136 items = [_string_escape('%s:%s' % (k, d[k])) for k in keys]
137 137 return "\0".join(items)
138 138
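A round-trip sketch (Python 2, hypothetical values) using the module's
_string_escape/_string_unescape: sorted, escaped key:value pairs joined with
NUL bytes, so the encoded extra is deterministic and newline-free:

    d = {'branch': 'stable', 'note': 'two\nlines'}
    enc = '\x00'.join([_string_escape('%s:%s' % (k, d[k])) for k in sorted(d)])
    # enc == 'branch:stable\x00note:two\\nlines'
    dec = dict([_string_unescape(l).split(':', 1) for l in enc.split('\x00')])
    assert dec == d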
139 139 def extract(self, text):
140 140 """
141 141 format used:
142 142 nodeid\n : manifest node in ascii
143 143 user\n : user, no \n or \r allowed
144 144 time tz extra\n : date (time is int or float, timezone is int)
145 145 : extra is metadata, encoded and separated by '\0'
146 146 : older versions ignore it
147 147 files\n\n : files modified by the cset, no \n or \r allowed
148 148 (.*) : comment (free text, ideally utf-8)
149 149
150 150 changelog v0 doesn't use extra
151 151 """
152 152 if not text:
153 153 return (nullid, "", (0, 0), [], "", {'branch': 'default'})
154 154 last = text.index("\n\n")
155 155 desc = util.tolocal(text[last + 2:])
156 156 l = text[:last].split('\n')
157 157 manifest = bin(l[0])
158 158 user = util.tolocal(l[1])
159 159
160 160 extra_data = l[2].split(' ', 2)
161 161 if len(extra_data) != 3:
162 162 time = float(extra_data.pop(0))
163 163 try:
164 164 # various tools did silly things with the time zone field.
165 165 timezone = int(extra_data[0])
166 166 except:
167 167 timezone = 0
168 168 extra = {}
169 169 else:
170 170 time, timezone, extra = extra_data
171 171 time, timezone = float(time), int(timezone)
172 172 extra = self.decode_extra(extra)
173 173 if not extra.get('branch'):
174 174 extra['branch'] = 'default'
175 175 files = l[3:]
176 176 return (manifest, user, (time, timezone), files, desc, extra)
177 177
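A worked sketch of the format extract() parses (all values hypothetical):

    text = ('0123456789abcdef0123456789abcdef01234567\n'   # manifest node hex
            'alice\n'                                       # user
            '1190000000 -7200 branch:stable\n'              # time tz extra
            'a/file.txt\n'                                  # files
            '\n'
            'commit message')                               # description
    # extract(text) -> (bin(...), 'alice', (1190000000.0, -7200),
    #                   ['a/file.txt'], 'commit message', {'branch': 'stable'})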
178 178 def read(self, node):
179 179 return self.extract(self.revision(node))
180 180
181 181 def add(self, manifest, list, desc, transaction, p1=None, p2=None,
182 182 user=None, date=None, extra={}):
183 183
184 184 user, desc = util.fromlocal(user), util.fromlocal(desc)
185 185
186 186 if date:
187 187 parseddate = "%d %d" % util.parsedate(date)
188 188 else:
189 189 parseddate = "%d %d" % util.makedate()
190 190 if extra and extra.get("branch") in ("default", ""):
191 191 del extra["branch"]
192 192 if extra:
193 193 extra = self.encode_extra(extra)
194 194 parseddate = "%s %s" % (parseddate, extra)
195 195 list.sort()
196 196 l = [hex(manifest), user, parseddate] + list + ["", desc]
197 197 text = "\n".join(l)
198 198 return self.addrevision(text, transaction, self.count(), p1, p2)
@@ -1,1291 +1,1291 @@ revlog.py
1 1 """
2 2 revlog.py - storage back-end for mercurial
3 3
4 4 This provides efficient delta storage with O(1) retrieve and append
5 5 and O(changes) merge between branches
6 6
7 7 Copyright 2005-2007 Matt Mackall <mpm@selenic.com>
8 8
9 9 This software may be used and distributed according to the terms
10 10 of the GNU General Public License, incorporated herein by reference.
11 11 """
12 12
13 13 from node import *
14 14 from i18n import _
15 15 import binascii, changegroup, errno, ancestor, mdiff, os
16 16 import sha, struct, util, zlib
17 17
18 18 _pack = struct.pack
19 19 _unpack = struct.unpack
20 20 _compress = zlib.compress
21 21 _decompress = zlib.decompress
22 22 _sha = sha.new
23 23
24 24 # revlog flags
25 25 REVLOGV0 = 0
26 26 REVLOGNG = 1
27 27 REVLOGNGINLINEDATA = (1 << 16)
28 28 REVLOG_DEFAULT_FLAGS = REVLOGNGINLINEDATA
29 29 REVLOG_DEFAULT_FORMAT = REVLOGNG
30 30 REVLOG_DEFAULT_VERSION = REVLOG_DEFAULT_FORMAT | REVLOG_DEFAULT_FLAGS
31 31
32 32 class RevlogError(Exception):
33 33 pass
34 34 class LookupError(RevlogError):
35 35 pass
36 36
37 37 def getoffset(q):
38 38 return int(q >> 16)
39 39
40 40 def gettype(q):
41 41 return int(q & 0xFFFF)
42 42
43 43 def offset_type(offset, type):
44 44 return long(long(offset) << 16 | type)
45 45
46 46 def hash(text, p1, p2):
47 47 """generate a hash from the given text and its parent hashes
48 48
49 49 This hash combines both the current file contents and its history
50 50 in a manner that makes it easy to distinguish nodes with the same
51 51 content in the revision graph.
52 52 """
53 53 l = [p1, p2]
54 54 l.sort()
55 55 s = _sha(l[0])
56 56 s.update(l[1])
57 57 s.update(text)
58 58 return s.digest()
59 59
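A sketch of the computation (Python 2, hypothetical parents): sha1 over the
two parent nodeids in sorted order, then over the text:

    import sha
    p1, p2 = '\x11' * 20, '\x22' * 20
    s = sha.new(min(p1, p2))
    s.update(max(p1, p2))
    s.update('file text')
    node = s.digest()        # the 20-byte binary nodeid hash() returns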
60 60 def compress(text):
61 61 """ generate a possibly-compressed representation of text """
62 62 if not text:
63 63 return ("", text)
64 64 if len(text) < 44:
65 65 if text[0] == '\0':
66 66 return ("", text)
67 67 return ('u', text)
68 68 bin = _compress(text)
69 69 if len(bin) > len(text):
70 70 if text[0] == '\0':
71 71 return ("", text)
72 72 return ('u', text)
73 73 return ("", bin)
74 74
75 75 def decompress(bin):
76 76 """ decompress the given input """
77 77 if not bin:
78 78 return bin
79 79 t = bin[0]
80 80 if t == '\0':
81 81 return bin
82 82 if t == 'x':
83 83 return _decompress(bin)
84 84 if t == 'u':
85 85 return bin[1:]
86 86 raise RevlogError(_("unknown compression type %r") % t)
87 87
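A round-trip sketch using the two functions above: a stored chunk is the
concatenation of the returned pair, and decompress() dispatches on its first
byte ('\0' literal, 'x' zlib stream, 'u' stored uncompressed):

    text = 'some revision text ' * 10
    h, d = compress(text)    # ('', <zlib data>) here, since this compresses well
    assert decompress(h + d) == text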
88 88 class lazyparser(object):
89 89 """
90 90 this class avoids the need to parse the entirety of large indices
91 91 """
92 92
93 93 # lazyparser is not safe to use on windows if win32 extensions not
94 94 # available. it keeps a file handle open, which makes it not possible
95 95 # to break hardlinks on local cloned repos.
96 96 safe_to_use = os.name != 'nt' or (not util.is_win_9x() and
97 97 hasattr(util, 'win32api'))
98 98
99 99 def __init__(self, dataf, size):
100 100 self.dataf = dataf
101 101 self.s = struct.calcsize(indexformatng)
102 102 self.datasize = size
103 103 self.l = size/self.s
104 104 self.index = [None] * self.l
105 105 self.map = {nullid: nullrev}
106 106 self.allmap = 0
107 107 self.all = 0
108 108 self.mapfind_count = 0
109 109
110 110 def loadmap(self):
111 111 """
112 112 during a commit, we need to make sure the rev being added is
113 113 not a duplicate. This requires loading the entire index,
114 114 which is fairly slow. loadmap can load up just the node map,
115 115 which takes much less time.
116 116 """
117 117 if self.allmap:
118 118 return
119 119 end = self.datasize
120 120 self.allmap = 1
121 121 cur = 0
122 122 count = 0
123 123 blocksize = self.s * 256
124 124 self.dataf.seek(0)
125 125 while cur < end:
126 126 data = self.dataf.read(blocksize)
127 127 off = 0
128 128 for x in xrange(256):
129 129 n = data[off + ngshaoffset:off + ngshaoffset + 20]
130 130 self.map[n] = count
131 131 count += 1
132 132 if count >= self.l:
133 133 break
134 134 off += self.s
135 135 cur += blocksize
136 136
137 137 def loadblock(self, blockstart, blocksize, data=None):
138 138 if self.all:
139 139 return
140 140 if data is None:
141 141 self.dataf.seek(blockstart)
142 142 if blockstart + blocksize > self.datasize:
143 143 # the revlog may have grown since we've started running,
144 144 # but we don't have space in self.index for more entries.
145 145 # limit blocksize so that we don't get too much data.
146 146 blocksize = max(self.datasize - blockstart, 0)
147 147 data = self.dataf.read(blocksize)
148 148 lend = len(data) / self.s
149 149 i = blockstart / self.s
150 150 off = 0
151 151 # lazyindex supports __delitem__
152 152 if lend > len(self.index) - i:
153 153 lend = len(self.index) - i
154 154 for x in xrange(lend):
155 155 if self.index[i + x] == None:
156 156 b = data[off : off + self.s]
157 157 self.index[i + x] = b
158 158 n = b[ngshaoffset:ngshaoffset + 20]
159 159 self.map[n] = i + x
160 160 off += self.s
161 161
162 162 def findnode(self, node):
163 163 """search backwards through the index file for a specific node"""
164 164 if self.allmap:
165 165 return None
166 166
167 167 # hg log will cause many many searches for the manifest
168 168 # nodes. After we get called a few times, just load the whole
169 169 # thing.
170 170 if self.mapfind_count > 8:
171 171 self.loadmap()
172 172 if node in self.map:
173 173 return node
174 174 return None
175 175 self.mapfind_count += 1
176 176 last = self.l - 1
177 177 while self.index[last] != None:
178 178 if last == 0:
179 179 self.all = 1
180 180 self.allmap = 1
181 181 return None
182 182 last -= 1
183 183 end = (last + 1) * self.s
184 184 blocksize = self.s * 256
185 185 while end >= 0:
186 186 start = max(end - blocksize, 0)
187 187 self.dataf.seek(start)
188 188 data = self.dataf.read(end - start)
189 189 findend = end - start
190 190 while True:
191 191 # we're searching backwards, so we have to make sure
192 192 # we don't find a changeset where this node is a parent
193 193 off = data.find(node, 0, findend)
194 194 findend = off
195 195 if off >= 0:
196 196 i = off / self.s
197 197 off = i * self.s
198 198 n = data[off + ngshaoffset:off + ngshaoffset + 20]
199 199 if n == node:
200 200 self.map[n] = i + start / self.s
201 201 return node
202 202 else:
203 203 break
204 204 end -= blocksize
205 205 return None
206 206
207 207 def loadindex(self, i=None, end=None):
208 208 if self.all:
209 209 return
210 210 all = False
211 211 if i == None:
212 212 blockstart = 0
213 213 blocksize = (65536 / self.s) * self.s
214 214 end = self.datasize
215 215 all = True
216 216 else:
217 217 if end:
218 218 blockstart = i * self.s
219 219 end = end * self.s
220 220 blocksize = end - blockstart
221 221 else:
222 222 blockstart = (i & ~1023) * self.s
223 223 blocksize = self.s * 1024
224 224 end = blockstart + blocksize
225 225 while blockstart < end:
226 226 self.loadblock(blockstart, blocksize)
227 227 blockstart += blocksize
228 228 if all:
229 229 self.all = True
230 230
231 231 class lazyindex(object):
232 232 """a lazy version of the index array"""
233 233 def __init__(self, parser):
234 234 self.p = parser
235 235 def __len__(self):
236 236 return len(self.p.index)
237 237 def load(self, pos):
238 238 if pos < 0:
239 239 pos += len(self.p.index)
240 240 self.p.loadindex(pos)
241 241 return self.p.index[pos]
242 242 def __getitem__(self, pos):
243 243 return _unpack(indexformatng, self.p.index[pos] or self.load(pos))
244 244 def __setitem__(self, pos, item):
245 245 self.p.index[pos] = _pack(indexformatng, *item)
246 246 def __delitem__(self, pos):
247 247 del self.p.index[pos]
248 248 def insert(self, pos, e):
249 249 self.p.index.insert(pos, _pack(indexformatng, *e))
250 250 def append(self, e):
251 251 self.p.index.append(_pack(indexformatng, *e))
252 252
253 253 class lazymap(object):
254 254 """a lazy version of the node map"""
255 255 def __init__(self, parser):
256 256 self.p = parser
257 257 def load(self, key):
258 258 n = self.p.findnode(key)
259 259 if n == None:
260 260 raise KeyError(key)
261 261 def __contains__(self, key):
262 262 if key in self.p.map:
263 263 return True
264 264 self.p.loadmap()
265 265 return key in self.p.map
266 266 def __iter__(self):
267 267 yield nullid
268 268 for i in xrange(self.p.l):
269 269 ret = self.p.index[i]
270 270 if not ret:
271 271 self.p.loadindex(i)
272 272 ret = self.p.index[i]
273 273 if isinstance(ret, str):
274 274 ret = _unpack(indexformatng, ret)
275 275 yield ret[7]
276 276 def __getitem__(self, key):
277 277 try:
278 278 return self.p.map[key]
279 279 except KeyError:
280 280 try:
281 281 self.load(key)
282 282 return self.p.map[key]
283 283 except KeyError:
284 284 raise KeyError("node " + hex(key))
285 285 def __setitem__(self, key, val):
286 286 self.p.map[key] = val
287 287 def __delitem__(self, key):
288 288 del self.p.map[key]
289 289
290 290 indexformatv0 = ">4l20s20s20s"
291 291 v0shaoffset = 56
292 292
293 293 class revlogoldio(object):
294 294 def __init__(self):
295 295 self.size = struct.calcsize(indexformatv0)
296 296
297 297 def parseindex(self, fp, inline):
298 298 s = self.size
299 299 index = []
300 300 nodemap = {nullid: nullrev}
301 301 n = off = 0
302 302 data = fp.read()
303 303 l = len(data)
304 304 while off + s <= l:
305 305 cur = data[off:off + s]
306 306 off += s
307 307 e = _unpack(indexformatv0, cur)
308 308 # transform to revlogv1 format
309 309 e2 = (offset_type(e[0], 0), e[1], -1, e[2], e[3],
310 310 nodemap[e[4]], nodemap[e[5]], e[6])
311 311 index.append(e2)
312 312 nodemap[e[6]] = n
313 313 n += 1
314 314
315 315 return index, nodemap, None
316 316
317 317 def packentry(self, entry, node, version, rev):
318 318 e2 = (getoffset(entry[0]), entry[1], entry[3], entry[4],
319 319 node(entry[5]), node(entry[6]), entry[7])
320 320 return _pack(indexformatv0, *e2)
321 321
322 322 # index ng:
323 323 # 6 bytes offset
324 324 # 2 bytes flags
325 325 # 4 bytes compressed length
326 326 # 4 bytes uncompressed length
327 327 # 4 bytes: base rev
328 328 # 4 bytes link rev
329 329 # 4 bytes parent 1 rev
330 330 # 4 bytes parent 2 rev
331 331 # 32 bytes: nodeid
332 332 indexformatng = ">Qiiiiii20s12x"
333 333 ngshaoffset = 32
334 334 versionformat = ">I"
335 335
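A quick check of the layout above (Python 2): each packed entry is 64 bytes,
and for rev 0 packentry() below overlays the version word on the first four
bytes of the offset field:

    import struct
    assert struct.calcsize(">Qiiiiii20s12x") == 64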
336 336 class revlogio(object):
337 337 def __init__(self):
338 338 self.size = struct.calcsize(indexformatng)
339 339
340 340 def parseindex(self, fp, inline):
341 341 try:
342 342 size = util.fstat(fp).st_size
343 343 except AttributeError:
344 344 size = 0
345 345
346 346 if lazyparser.safe_to_use and not inline and size > 1000000:
347 347 # big index, let's parse it on demand
348 348 parser = lazyparser(fp, size)
349 349 index = lazyindex(parser)
350 350 nodemap = lazymap(parser)
351 351 e = list(index[0])
352 352 type = gettype(e[0])
353 353 e[0] = offset_type(0, type)
354 354 index[0] = e
355 355 return index, nodemap, None
356 356
357 357 s = self.size
358 358 cache = None
359 359 index = []
360 360 nodemap = {nullid: nullrev}
361 361 n = off = 0
362 362 # if we're not using lazymap, always read the whole index
363 363 data = fp.read()
364 364 l = len(data) - s
365 365 append = index.append
366 366 if inline:
367 367 cache = (0, data)
368 368 while off <= l:
369 369 e = _unpack(indexformatng, data[off:off + s])
370 370 nodemap[e[7]] = n
371 371 append(e)
372 372 n += 1
373 373 if e[1] < 0:
374 374 break
375 375 off += e[1] + s
376 376 else:
377 377 while off <= l:
378 378 e = _unpack(indexformatng, data[off:off + s])
379 379 nodemap[e[7]] = n
380 380 append(e)
381 381 n += 1
382 382 off += s
383 383
384 384 e = list(index[0])
385 385 type = gettype(e[0])
386 386 e[0] = offset_type(0, type)
387 387 index[0] = e
388 388
389 389 return index, nodemap, cache
390 390
391 391 def packentry(self, entry, node, version, rev):
392 392 p = _pack(indexformatng, *entry)
393 393 if rev == 0:
394 394 p = _pack(versionformat, version) + p[4:]
395 395 return p
396 396
397 397 class revlog(object):
398 398 """
399 399 the underlying revision storage object
400 400
401 401 A revlog consists of two parts, an index and the revision data.
402 402
403 403 The index is a file with a fixed record size containing
404 404 information on each revision, including its nodeid (hash), the
405 405 nodeids of its parents, the position and offset of its data within
406 406 the data file, and the revision it's based on. Finally, each entry
407 407 contains a linkrev entry that can serve as a pointer to external
408 408 data.
409 409
410 410 The revision data itself is a linear collection of data chunks.
411 411 Each chunk represents a revision and is usually represented as a
412 412 delta against the previous chunk. To bound lookup time, runs of
413 413 deltas are limited to about 2 times the length of the original
414 414 version data. This makes retrieval of a version proportional to
415 415 its size, or O(1) relative to the number of revisions.
416 416
417 417 Both pieces of the revlog are written to in an append-only
418 418 fashion, which means we never need to rewrite a file to insert or
419 419 remove data, and can use some simple techniques to avoid the need
420 420 for locking while reading.
421 421 """
422 422 def __init__(self, opener, indexfile):
423 423 """
424 424 create a revlog object
425 425
426 426 opener is a function that abstracts the file opening operation
427 427 and can be used to implement COW semantics or the like.
428 428 """
429 429 self.indexfile = indexfile
430 430 self.datafile = indexfile[:-2] + ".d"
431 431 self.opener = opener
432 432 self._cache = None
433 433 self._chunkcache = None
434 434 self.nodemap = {nullid: nullrev}
435 435 self.index = []
436 436
437 437 v = REVLOG_DEFAULT_VERSION
438 438 if hasattr(opener, "defversion"):
439 439 v = opener.defversion
440 440 if v & REVLOGNG:
441 441 v |= REVLOGNGINLINEDATA
442 442
443 443 i = ""
444 444 try:
445 445 f = self.opener(self.indexfile)
446 446 i = f.read(4)
447 447 f.seek(0)
448 448 if len(i) > 0:
449 449 v = struct.unpack(versionformat, i)[0]
450 450 except IOError, inst:
451 451 if inst.errno != errno.ENOENT:
452 452 raise
453 453
454 454 self.version = v
455 455 self._inline = v & REVLOGNGINLINEDATA
456 456 flags = v & ~0xFFFF
457 457 fmt = v & 0xFFFF
458 458 if fmt == REVLOGV0 and flags:
459 459 raise RevlogError(_("index %s unknown flags %#04x for format v0")
460 460 % (self.indexfile, flags >> 16))
461 461 elif fmt == REVLOGNG and flags & ~REVLOGNGINLINEDATA:
462 462 raise RevlogError(_("index %s unknown flags %#04x for revlogng")
463 463 % (self.indexfile, flags >> 16))
464 464 elif fmt > REVLOGNG:
465 465 raise RevlogError(_("index %s unknown format %d")
466 466 % (self.indexfile, fmt))
467 467
468 468 self._io = revlogio()
469 469 if self.version == REVLOGV0:
470 470 self._io = revlogoldio()
471 471 if i:
472 472 d = self._io.parseindex(f, self._inline)
473 473 self.index, self.nodemap, self._chunkcache = d
474 474
475 475 # add the magic null revision at -1
476 476 self.index.append((0, 0, 0, -1, -1, -1, -1, nullid))
477 477
478 478 def _loadindex(self, start, end):
479 479 """load a block of indexes all at once from the lazy parser"""
480 480 if isinstance(self.index, lazyindex):
481 481 self.index.p.loadindex(start, end)
482 482
483 483 def _loadindexmap(self):
484 484 """loads both the map and the index from the lazy parser"""
485 485 if isinstance(self.index, lazyindex):
486 486 p = self.index.p
487 487 p.loadindex()
488 488 self.nodemap = p.map
489 489
490 490 def _loadmap(self):
491 491 """loads the map from the lazy parser"""
492 492 if isinstance(self.nodemap, lazymap):
493 493 self.nodemap.p.loadmap()
494 494 self.nodemap = self.nodemap.p.map
495 495
496 496 def tip(self):
497 497 return self.node(len(self.index) - 2)
498 498 def count(self):
499 499 return len(self.index) - 1
500 500
501 501 def rev(self, node):
502 502 try:
503 503 return self.nodemap[node]
504 504 except KeyError:
505 505 raise LookupError(_('%s: no node %s') % (self.indexfile, hex(node)))
506 506 def node(self, rev):
507 507 return self.index[rev][7]
508 508 def linkrev(self, node):
509 509 return self.index[self.rev(node)][4]
510 510 def parents(self, node):
511 511 d = self.index[self.rev(node)][5:7]
512 512 return (self.node(d[0]), self.node(d[1]))
513 513 def parentrevs(self, rev):
514 514 return self.index[rev][5:7]
515 515 def start(self, rev):
516 516 return int(self.index[rev][0] >> 16)
517 517 def end(self, rev):
518 518 return self.start(rev) + self.length(rev)
519 519 def length(self, rev):
520 520 return self.index[rev][1]
521 521 def base(self, rev):
522 522 return self.index[rev][3]
523 523
524 524 def size(self, rev):
525 525 """return the length of the uncompressed text for a given revision"""
526 526 l = self.index[rev][2]
527 527 if l >= 0:
528 528 return l
529 529
530 530 t = self.revision(self.node(rev))
531 531 return len(t)
532 532
533 533 # alternate implementation, The advantage to this code is it
534 534 # will be faster for a single revision. But, the results are not
535 535 # cached, so finding the size of every revision will be slower.
536 536 """
537 537 if self.cache and self.cache[1] == rev:
538 538 return len(self.cache[2])
539 539
540 540 base = self.base(rev)
541 541 if self.cache and self.cache[1] >= base and self.cache[1] < rev:
542 542 base = self.cache[1]
543 543 text = self.cache[2]
544 544 else:
545 545 text = self.revision(self.node(base))
546 546
547 547 l = len(text)
548 548 for x in xrange(base + 1, rev + 1):
549 549 l = mdiff.patchedsize(l, self.chunk(x))
550 550 return l
551 551 """
552 552
553 553 def reachable(self, node, stop=None):
554 554 """return a hash of all nodes ancestral to a given node, including
555 555 the node itself, stopping when stop is matched"""
556 556 reachable = {}
557 557 visit = [node]
558 558 reachable[node] = 1
559 559 if stop:
560 560 stopn = self.rev(stop)
561 561 else:
562 562 stopn = 0
563 563 while visit:
564 564 n = visit.pop(0)
565 565 if n == stop:
566 566 continue
567 567 if n == nullid:
568 568 continue
569 569 for p in self.parents(n):
570 570 if self.rev(p) < stopn:
571 571 continue
572 572 if p not in reachable:
573 573 reachable[p] = 1
574 574 visit.append(p)
575 575 return reachable
576 576
577 577 def nodesbetween(self, roots=None, heads=None):
578 578 """Return a tuple containing three elements. Elements 1 and 2 contain
579 579 a final list of bases and heads after all the unreachable ones have been
580 580 pruned. Element 0 contains a topologically sorted list of all
581 581
582 582 nodes that satisfy these constraints:
583 583 1. All nodes must be descended from a node in roots (the nodes on
584 584 roots are considered descended from themselves).
585 585 2. All nodes must also be ancestors of a node in heads (the nodes in
586 586 heads are considered to be their own ancestors).
587 587
588 588 If roots is unspecified, nullid is assumed as the only root.
589 589 If heads is unspecified, it is taken to be the output of the
590 590 heads method (i.e. a list of all nodes in the repository that
591 591 have no children)."""
592 592 nonodes = ([], [], [])
593 593 if roots is not None:
594 594 roots = list(roots)
595 595 if not roots:
596 596 return nonodes
597 597 lowestrev = min([self.rev(n) for n in roots])
598 598 else:
599 599 roots = [nullid] # Everybody's a descendent of nullid
600 600 lowestrev = nullrev
601 601 if (lowestrev == nullrev) and (heads is None):
602 602 # We want _all_ the nodes!
603 603 return ([self.node(r) for r in xrange(0, self.count())],
604 604 [nullid], list(self.heads()))
605 605 if heads is None:
606 606 # All nodes are ancestors, so the latest ancestor is the last
607 607 # node.
608 608 highestrev = self.count() - 1
609 609 # Set ancestors to None to signal that every node is an ancestor.
610 610 ancestors = None
611 611 # Set heads to an empty dictionary for later discovery of heads
612 612 heads = {}
613 613 else:
614 614 heads = list(heads)
615 615 if not heads:
616 616 return nonodes
617 617 ancestors = {}
618 618 # Turn heads into a dictionary so we can remove 'fake' heads.
619 619 # Also, later we will be using it to filter out the heads we can't
620 620 # find from roots.
621 621 heads = dict.fromkeys(heads, 0)
622 622 # Start at the top and keep marking parents until we're done.
623 623 nodestotag = heads.keys()
624 624 # Remember where the top was so we can use it as a limit later.
625 625 highestrev = max([self.rev(n) for n in nodestotag])
626 626 while nodestotag:
627 627 # grab a node to tag
628 628 n = nodestotag.pop()
629 629 # Never tag nullid
630 630 if n == nullid:
631 631 continue
632 632 # A node's revision number represents its place in a
633 633 # topologically sorted list of nodes.
634 634 r = self.rev(n)
635 635 if r >= lowestrev:
636 636 if n not in ancestors:
637 637 # If we are possibly a descendent of one of the roots
638 638 # and we haven't already been marked as an ancestor
639 639 ancestors[n] = 1 # Mark as ancestor
640 640 # Add non-nullid parents to list of nodes to tag.
641 641 nodestotag.extend([p for p in self.parents(n) if
642 642 p != nullid])
643 643 elif n in heads: # We've seen it before, is it a fake head?
644 644 # So it is, real heads should not be the ancestors of
645 645 # any other heads.
646 646 heads.pop(n)
647 647 if not ancestors:
648 648 return nonodes
649 649 # Now that we have our set of ancestors, we want to remove any
650 650 # roots that are not ancestors.
651 651
652 652 # If one of the roots was nullid, everything is included anyway.
653 653 if lowestrev > nullrev:
654 654 # But, since we weren't, let's recompute the lowest rev to not
655 655 # include roots that aren't ancestors.
656 656
657 657 # Filter out roots that aren't ancestors of heads
658 658 roots = [n for n in roots if n in ancestors]
659 659 # Recompute the lowest revision
660 660 if roots:
661 661 lowestrev = min([self.rev(n) for n in roots])
662 662 else:
663 663 # No more roots? Return empty list
664 664 return nonodes
665 665 else:
666 666 # We are descending from nullid, and don't need to care about
667 667 # any other roots.
668 668 lowestrev = nullrev
669 669 roots = [nullid]
670 670 # Transform our roots list into a 'set' (i.e. a dictionary where the
671 671 # values don't matter).
672 672 descendents = dict.fromkeys(roots, 1)
673 673 # Also, keep the original roots so we can filter out roots that aren't
674 674 # 'real' roots (i.e. are descended from other roots).
675 675 roots = descendents.copy()
676 676 # Our topologically sorted list of output nodes.
677 677 orderedout = []
678 678 # Don't start at nullid since we don't want nullid in our output list,
679 679 # and if nullid shows up in descendents, empty parents will look like
680 680 # they're descendents.
681 681 for r in xrange(max(lowestrev, 0), highestrev + 1):
682 682 n = self.node(r)
683 683 isdescendent = False
684 684 if lowestrev == nullrev: # Everybody is a descendent of nullid
685 685 isdescendent = True
686 686 elif n in descendents:
687 687 # n is already a descendent
688 688 isdescendent = True
689 689 # This check only needs to be done here because all the roots
690 690 # will start being marked as descendents before the loop.
691 691 if n in roots:
692 692 # If n was a root, check if it's a 'real' root.
693 693 p = tuple(self.parents(n))
694 694 # If any of its parents are descendents, it's not a root.
695 695 if (p[0] in descendents) or (p[1] in descendents):
696 696 roots.pop(n)
697 697 else:
698 698 p = tuple(self.parents(n))
699 699 # A node is a descendent if either of its parents are
700 700 # descendents. (We seeded the descendents list with the roots
701 701 # up there, remember?)
702 702 if (p[0] in descendents) or (p[1] in descendents):
703 703 descendents[n] = 1
704 704 isdescendent = True
705 705 if isdescendent and ((ancestors is None) or (n in ancestors)):
706 706 # Only include nodes that are both descendents and ancestors.
707 707 orderedout.append(n)
708 708 if (ancestors is not None) and (n in heads):
709 709 # We're trying to figure out which heads are reachable
710 710 # from roots.
711 711 # Mark this head as having been reached
712 712 heads[n] = 1
713 713 elif ancestors is None:
714 714 # Otherwise, we're trying to discover the heads.
715 715 # Assume this is a head because if it isn't, the next step
716 716 # will eventually remove it.
717 717 heads[n] = 1
718 718 # But, obviously its parents aren't.
719 719 for p in self.parents(n):
720 720 heads.pop(p, None)
721 721 heads = [n for n in heads.iterkeys() if heads[n] != 0]
722 722 roots = roots.keys()
723 723 assert orderedout
724 724 assert roots
725 725 assert heads
726 726 return (orderedout, roots, heads)
727 727
728 728 def heads(self, start=None, stop=None):
729 729 """return the list of all nodes that have no children
730 730
731 731 if start is specified, only heads that are descendants of
732 732 start will be returned
733 733 if stop is specified, it will consider all the revs from stop
734 734 as if they had no children
735 735 """
736 736 if start is None and stop is None:
737 737 count = self.count()
738 738 if not count:
739 739 return [nullid]
740 740 ishead = [1] * (count + 1)
741 741 index = self.index
742 742 for r in xrange(count):
743 743 e = index[r]
744 744 ishead[e[5]] = ishead[e[6]] = 0
745 745 return [self.node(r) for r in xrange(count) if ishead[r]]
746 746
747 747 if start is None:
748 748 start = nullid
749 749 if stop is None:
750 750 stop = []
751 751 stoprevs = dict.fromkeys([self.rev(n) for n in stop])
752 752 startrev = self.rev(start)
753 753 reachable = {startrev: 1}
754 754 heads = {startrev: 1}
755 755
756 756 parentrevs = self.parentrevs
757 757 for r in xrange(startrev + 1, self.count()):
758 758 for p in parentrevs(r):
759 759 if p in reachable:
760 760 if r not in stoprevs:
761 761 reachable[r] = 1
762 762 heads[r] = 1
763 763 if p in heads and p not in stoprevs:
764 764 del heads[p]
765 765
766 766 return [self.node(r) for r in heads]
767 767
768 768 def children(self, node):
769 769 """find the children of a given node"""
770 770 c = []
771 771 p = self.rev(node)
772 772 for r in range(p + 1, self.count()):
773 773 prevs = [pr for pr in self.parentrevs(r) if pr != nullrev]
774 774 if prevs:
775 775 for pr in prevs:
776 776 if pr == p:
777 777 c.append(self.node(r))
778 778 elif p == nullrev:
779 779 c.append(self.node(r))
780 780 return c
781 781
782 782 def _match(self, id):
783 783 if isinstance(id, (long, int)):
784 784 # rev
785 785 return self.node(id)
786 786 if len(id) == 20:
787 787 # possibly a binary node
788 788 # odds of a binary node being all hex in ASCII are 1 in 10**25
789 789 try:
790 790 node = id
791 791 r = self.rev(node) # quick search the index
792 792 return node
793 793 except LookupError:
794 794 pass # may be partial hex id
795 795 try:
796 796 # str(rev)
797 797 rev = int(id)
798 798 if str(rev) != id:
799 799 raise ValueError
800 800 if rev < 0:
801 801 rev = self.count() + rev
802 802 if rev < 0 or rev >= self.count():
803 803 raise ValueError
804 804 return self.node(rev)
805 805 except (ValueError, OverflowError):
806 806 pass
807 807 if len(id) == 40:
808 808 try:
809 809 # a full hex nodeid?
810 810 node = bin(id)
811 811 r = self.rev(node)
812 812 return node
813 813 except TypeError:
814 814 pass
815 815
816 816 def _partialmatch(self, id):
817 817 if len(id) < 40:
818 818 try:
819 819 # hex(node)[:...]
820 820 bin_id = bin(id[:len(id) & ~1]) # grab an even number of digits
821 821 node = None
822 822 for n in self.nodemap:
823 823 if n.startswith(bin_id) and hex(n).startswith(id):
824 824 if node is not None:
825 825 raise LookupError(_("Ambiguous identifier"))
826 826 node = n
827 827 if node is not None:
828 828 return node
829 829 except TypeError:
830 830 pass
831 831
832 832 def lookup(self, id):
833 833 """locate a node based on:
834 834 - revision number or str(revision number)
835 835 - nodeid or subset of hex nodeid
836 836 """
837 837 n = self._match(id)
838 838 if n is not None:
839 839 return n
840 840 n = self._partialmatch(id)
841 841 if n:
842 842 return n
843 843
844 844 raise LookupError(_("No match found"))
845 845
846 846 def cmp(self, node, text):
847 847 """compare text with a given file revision"""
848 848 p1, p2 = self.parents(node)
849 849 return hash(text, p1, p2) != node
850 850
851 851 def chunk(self, rev, df=None):
852 852 def loadcache(df):
853 853 if not df:
854 854 if self._inline:
855 855 df = self.opener(self.indexfile)
856 856 else:
857 857 df = self.opener(self.datafile)
858 858 df.seek(start)
859 859 self._chunkcache = (start, df.read(cache_length))
860 860
861 861 start, length = self.start(rev), self.length(rev)
862 862 if self._inline:
863 863 start += (rev + 1) * self._io.size
864 864 end = start + length
865 865
866 866 offset = 0
867 867 if not self._chunkcache:
868 868 cache_length = max(65536, length)
869 869 loadcache(df)
870 870 else:
871 871 cache_start = self._chunkcache[0]
872 872 cache_length = len(self._chunkcache[1])
873 873 cache_end = cache_start + cache_length
874 874 if start >= cache_start and end <= cache_end:
875 875 # it is cached
876 876 offset = start - cache_start
877 877 else:
878 878 cache_length = max(65536, length)
879 879 loadcache(df)
880 880
881 881 # avoid copying large chunks
882 882 c = self._chunkcache[1]
883 883 if cache_length != length:
884 884 c = c[offset:offset + length]
885 885
886 886 return decompress(c)
887 887
888 888 def delta(self, node):
889 889 """return or calculate a delta between a node and its predecessor"""
890 890 r = self.rev(node)
891 891 return self.revdiff(r - 1, r)
892 892
893 893 def revdiff(self, rev1, rev2):
894 894 """return or calculate a delta between two revisions"""
895 895 if rev1 + 1 == rev2 and self.base(rev1) == self.base(rev2):
896 896 return self.chunk(rev2)
897 897
898 898 return mdiff.textdiff(self.revision(self.node(rev1)),
899 899 self.revision(self.node(rev2)))
900 900
901 901 def revision(self, node):
902 902 """return an uncompressed revision of a given node"""
903 903 if node == nullid:
904 904 return ""
905 905 if self._cache and self._cache[0] == node:
906 return self._cache[2]
906 return str(self._cache[2])
907 907
908 908 # look up what we need to read
909 909 text = None
910 910 rev = self.rev(node)
911 911 base = self.base(rev)
912 912
913 913 # check rev flags
914 914 if self.index[rev][0] & 0xFFFF:
915 915 raise RevlogError(_('incompatible revision flag %x') %
916 916 (self.index[rev][0] & 0xFFFF))
917 917
918 918 if self._inline:
919 919 # we probably have the whole chunk cached
920 920 df = None
921 921 else:
922 922 df = self.opener(self.datafile)
923 923
924 924 # do we have useful data cached?
925 925 if self._cache and self._cache[1] >= base and self._cache[1] < rev:
926 926 base = self._cache[1]
927 text = self._cache[2]
927 text = str(self._cache[2])
928 928 self._loadindex(base, rev + 1)
929 929 else:
930 930 self._loadindex(base, rev + 1)
931 931 text = self.chunk(base, df=df)
932 932
933 933 bins = [self.chunk(r, df) for r in xrange(base + 1, rev + 1)]
934 934 text = mdiff.patches(text, bins)
935 935 p1, p2 = self.parents(node)
936 936 if node != hash(text, p1, p2):
937 937 raise RevlogError(_("integrity check failed on %s:%d")
938 938 % (self.datafile, rev))
939 939
940 940 self._cache = (node, rev, text)
941 941 return text
942 942
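The two str() calls above are the point of this changeset. Quoting the lines
further down where a Python 2 buffer can enter the cache:

    delta = buffer(chunk, 80)           # addgroup(): zero-copy slice of a chunk
    text = buffer(delta, 12)            # addgroup(): empty-parent fast path
    self._cache = (node, curr, text)    # _addrevision(): cached verbatim

Without the str() conversion, that buffer would escape to callers of
revision(), which expect a real string.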
943 943 def checkinlinesize(self, tr, fp=None):
944 944 if not self._inline:
945 945 return
946 946 if not fp:
947 947 fp = self.opener(self.indexfile, 'r')
948 948 fp.seek(0, 2)
949 949 size = fp.tell()
950 950 if size < 131072:
951 951 return
952 952 trinfo = tr.find(self.indexfile)
953 953 if trinfo == None:
954 954 raise RevlogError(_("%s not found in the transaction")
955 955 % self.indexfile)
956 956
957 957 trindex = trinfo[2]
958 958 dataoff = self.start(trindex)
959 959
960 960 tr.add(self.datafile, dataoff)
961 961 df = self.opener(self.datafile, 'w')
962 962 calc = self._io.size
963 963 for r in xrange(self.count()):
964 964 start = self.start(r) + (r + 1) * calc
965 965 length = self.length(r)
966 966 fp.seek(start)
967 967 d = fp.read(length)
968 968 df.write(d)
969 969 fp.close()
970 970 df.close()
971 971 fp = self.opener(self.indexfile, 'w', atomictemp=True)
972 972 self.version &= ~(REVLOGNGINLINEDATA)
973 973 self._inline = False
974 974 for i in xrange(self.count()):
975 975 e = self._io.packentry(self.index[i], self.node, self.version, i)
976 976 fp.write(e)
977 977
978 978 # if we don't call rename, the temp file will never replace the
979 979 # real index
980 980 fp.rename()
981 981
982 982 tr.replace(self.indexfile, trindex * calc)
983 983 self._chunkcache = None
984 984
985 985 def addrevision(self, text, transaction, link, p1, p2, d=None):
986 986 """add a revision to the log
987 987
988 988 text - the revision data to add
989 989 transaction - the transaction object used for rollback
990 990 link - the linkrev data to add
991 991 p1, p2 - the parent nodeids of the revision
992 992 d - an optional precomputed delta
993 993 """
994 994 dfh = None
995 995 if not self._inline:
996 996 dfh = self.opener(self.datafile, "a")
997 997 ifh = self.opener(self.indexfile, "a+")
998 998 return self._addrevision(text, transaction, link, p1, p2, d, ifh, dfh)
999 999
1000 1000 def _addrevision(self, text, transaction, link, p1, p2, d, ifh, dfh):
1001 1001 node = hash(text, p1, p2)
1002 1002 if node in self.nodemap:
1003 1003 return node
1004 1004
1005 1005 curr = self.count()
1006 1006 prev = curr - 1
1007 1007 base = self.base(prev)
1008 1008 offset = self.end(prev)
1009 1009
1010 1010 if curr:
1011 1011 if not d:
1012 1012 ptext = self.revision(self.node(prev))
1013 1013 d = mdiff.textdiff(ptext, text)
1014 1014 data = compress(d)
1015 1015 l = len(data[1]) + len(data[0])
1016 1016 dist = l + offset - self.start(base)
1017 1017
1018 1018 # full versions are inserted when the needed deltas
1019 1019 # become comparable to the uncompressed text
1020 1020 if not curr or dist > len(text) * 2:
1021 1021 data = compress(text)
1022 1022 l = len(data[1]) + len(data[0])
1023 1023 base = curr
1024 1024
1025 1025 e = (offset_type(offset, 0), l, len(text),
1026 1026 base, link, self.rev(p1), self.rev(p2), node)
1027 1027 self.index.insert(-1, e)
1028 1028 self.nodemap[node] = curr
1029 1029
1030 1030 entry = self._io.packentry(e, self.node, self.version, curr)
1031 1031 if not self._inline:
1032 1032 transaction.add(self.datafile, offset)
1033 1033 transaction.add(self.indexfile, curr * len(entry))
1034 1034 if data[0]:
1035 1035 dfh.write(data[0])
1036 1036 dfh.write(data[1])
1037 1037 dfh.flush()
1038 1038 ifh.write(entry)
1039 1039 else:
1040 1040 offset += curr * self._io.size
1041 1041 transaction.add(self.indexfile, offset, curr)
1042 1042 ifh.write(entry)
1043 1043 ifh.write(data[0])
1044 1044 ifh.write(data[1])
1045 1045 self.checkinlinesize(transaction, ifh)
1046 1046
1047 1047 self._cache = (node, curr, text)
1048 1048 return node
1049 1049
1050 1050 def ancestor(self, a, b):
1051 1051 """calculate the least common ancestor of nodes a and b"""
1052 1052
1053 1053 def parents(rev):
1054 1054 return [p for p in self.parentrevs(rev) if p != nullrev]
1055 1055
1056 1056 c = ancestor.ancestor(self.rev(a), self.rev(b), parents)
1057 1057 if c is None:
1058 1058 return nullid
1059 1059
1060 1060 return self.node(c)
1061 1061
1062 1062 def group(self, nodelist, lookup, infocollect=None):
1063 1063 """calculate a delta group
1064 1064
1065 1065 Given a list of changeset revs, return a set of deltas and
1066 1066 metadata corresponding to nodes. the first delta is
1067 1067 parent(nodes[0]) -> nodes[0] the receiver is guaranteed to
1068 1068 have this parent as it has all history before these
1069 1069 changesets. parent is parent[0]
1070 1070 """
1071 1071 revs = [self.rev(n) for n in nodelist]
1072 1072
1073 1073 # if we don't have any revisions touched by these changesets, bail
1074 1074 if not revs:
1075 1075 yield changegroup.closechunk()
1076 1076 return
1077 1077
1078 1078 # add the parent of the first rev
1079 1079 p = self.parents(self.node(revs[0]))[0]
1080 1080 revs.insert(0, self.rev(p))
1081 1081
1082 1082 # build deltas
1083 1083 for d in xrange(0, len(revs) - 1):
1084 1084 a, b = revs[d], revs[d + 1]
1085 1085 nb = self.node(b)
1086 1086
1087 1087 if infocollect is not None:
1088 1088 infocollect(nb)
1089 1089
1090 1090 p = self.parents(nb)
1091 1091 meta = nb + p[0] + p[1] + lookup(nb)
1092 1092 if a == -1:
1093 1093 d = self.revision(nb)
1094 1094 meta += mdiff.trivialdiffheader(len(d))
1095 1095 else:
1096 1096 d = self.revdiff(a, b)
1097 1097 yield changegroup.chunkheader(len(meta) + len(d))
1098 1098 yield meta
1099 1099 if len(d) > 2**20:
1100 1100 pos = 0
1101 1101 while pos < len(d):
1102 1102 pos2 = pos + 2 ** 18
1103 1103 yield d[pos:pos2]
1104 1104 pos = pos2
1105 1105 else:
1106 1106 yield d
1107 1107
1108 1108 yield changegroup.closechunk()
1109 1109
1110 1110 def addgroup(self, revs, linkmapper, transaction, unique=0):
1111 1111 """
1112 1112 add a delta group
1113 1113
1114 1114 given a set of deltas, add them to the revision log. the
1115 1115 first delta is against its parent, which should be in our
1116 1116 log, the rest are against the previous delta.
1117 1117 """
1118 1118
1119 1119 #track the base of the current delta log
1120 1120 r = self.count()
1121 1121 t = r - 1
1122 1122 node = None
1123 1123
1124 1124 base = prev = nullrev
1125 1125 start = end = textlen = 0
1126 1126 if r:
1127 1127 end = self.end(t)
1128 1128
1129 1129 ifh = self.opener(self.indexfile, "a+")
1130 1130 isize = r * self._io.size
1131 1131 if self._inline:
1132 1132 transaction.add(self.indexfile, end + isize, r)
1133 1133 dfh = None
1134 1134 else:
1135 1135 transaction.add(self.indexfile, isize, r)
1136 1136 transaction.add(self.datafile, end)
1137 1137 dfh = self.opener(self.datafile, "a")
1138 1138
1139 1139 # loop through our set of deltas
1140 1140 chain = None
1141 1141 for chunk in revs:
1142 1142 node, p1, p2, cs = struct.unpack("20s20s20s20s", chunk[:80])
1143 1143 link = linkmapper(cs)
1144 1144 if node in self.nodemap:
1145 1145 # this can happen if two branches make the same change
1146 1146 # if unique:
1147 1147 # raise RevlogError(_("already have %s") % hex(node[:4]))
1148 1148 chain = node
1149 1149 continue
1150 1150 delta = buffer(chunk, 80)
1151 1151 del chunk
1152 1152
1153 1153 for p in (p1, p2):
1154 1154 if not p in self.nodemap:
1155 1155 raise LookupError(_("unknown parent %s") % short(p))
1156 1156
1157 1157 if not chain:
1158 1158 # retrieve the parent revision of the delta chain
1159 1159 chain = p1
1160 1160 if not chain in self.nodemap:
1161 1161 raise LookupError(_("unknown base %s") % short(chain[:4]))
1162 1162
1163 1163 # full versions are inserted when the needed deltas become
1164 1164 # comparable to the uncompressed text or when the previous
1165 1165 # version is not the one we have a delta against. We use
1166 1166 # the size of the previous full rev as a proxy for the
1167 1167 # current size.
1168 1168
1169 1169 if chain == prev:
1170 1170 cdelta = compress(delta)
1171 1171 cdeltalen = len(cdelta[0]) + len(cdelta[1])
1172 1172 textlen = mdiff.patchedsize(textlen, delta)
1173 1173
1174 1174 if chain != prev or (end - start + cdeltalen) > textlen * 2:
1175 1175 # flush our writes here so we can read it in revision
1176 1176 if dfh:
1177 1177 dfh.flush()
1178 1178 ifh.flush()
1179 1179 text = self.revision(chain)
1180 1180 if len(text) == 0:
1181 1181 # skip over trivial delta header
1182 1182 text = buffer(delta, 12)
1183 1183 else:
1184 1184 text = mdiff.patches(text, [delta])
1185 1185 del delta
1186 1186 chk = self._addrevision(text, transaction, link, p1, p2, None,
1187 1187 ifh, dfh)
1188 1188 if not dfh and not self._inline:
1189 1189 # addrevision switched from inline to conventional
1190 1190 # reopen the index
1191 1191 dfh = self.opener(self.datafile, "a")
1192 1192 ifh = self.opener(self.indexfile, "a")
1193 1193 if chk != node:
1194 1194 raise RevlogError(_("consistency error adding group"))
1195 1195 textlen = len(text)
1196 1196 else:
1197 1197 e = (offset_type(end, 0), cdeltalen, textlen, base,
1198 1198 link, self.rev(p1), self.rev(p2), node)
1199 1199 self.index.insert(-1, e)
1200 1200 self.nodemap[node] = r
1201 1201 entry = self._io.packentry(e, self.node, self.version, r)
1202 1202 if self._inline:
1203 1203 ifh.write(entry)
1204 1204 ifh.write(cdelta[0])
1205 1205 ifh.write(cdelta[1])
1206 1206 self.checkinlinesize(transaction, ifh)
1207 1207 if not self._inline:
1208 1208 dfh = self.opener(self.datafile, "a")
1209 1209 ifh = self.opener(self.indexfile, "a")
1210 1210 else:
1211 1211 dfh.write(cdelta[0])
1212 1212 dfh.write(cdelta[1])
1213 1213 ifh.write(entry)
1214 1214
1215 1215 t, r, chain, prev = r, r + 1, node, node
1216 1216 base = self.base(t)
1217 1217 start = self.start(base)
1218 1218 end = self.end(t)
1219 1219
1220 1220 return node
1221 1221
1222 1222 def strip(self, rev, minlink):
1223 1223 if self.count() == 0 or rev >= self.count():
1224 1224 return
1225 1225
1226 1226 if isinstance(self.index, lazyindex):
1227 1227 self._loadindexmap()
1228 1228
1229 1229 # When stripping away a revision, we need to make sure it
1230 1230 # does not actually belong to an older changeset.
1231 1231 # The minlink parameter defines the oldest revision
1232 1232 # we're allowed to strip away.
1233 1233 while minlink > self.index[rev][4]:
1234 1234 rev += 1
1235 1235 if rev >= self.count():
1236 1236 return
1237 1237
1238 1238 # first truncate the files on disk
1239 1239 end = self.start(rev)
1240 1240 if not self._inline:
1241 1241 df = self.opener(self.datafile, "a")
1242 1242 df.truncate(end)
1243 1243 end = rev * self._io.size
1244 1244 else:
1245 1245 end += rev * self._io.size
1246 1246
1247 1247 indexf = self.opener(self.indexfile, "a")
1248 1248 indexf.truncate(end)
1249 1249
1250 1250 # then reset internal state in memory to forget those revisions
1251 1251 self._cache = None
1252 1252 self._chunkcache = None
1253 1253 for x in xrange(rev, self.count()):
1254 1254 del self.nodemap[self.node(x)]
1255 1255
1256 1256 del self.index[rev:-1]
1257 1257
1258 1258 def checksize(self):
1259 1259 expected = 0
1260 1260 if self.count():
1261 1261 expected = max(0, self.end(self.count() - 1))
1262 1262
1263 1263 try:
1264 1264 f = self.opener(self.datafile)
1265 1265 f.seek(0, 2)
1266 1266 actual = f.tell()
1267 1267 dd = actual - expected
1268 1268 except IOError, inst:
1269 1269 if inst.errno != errno.ENOENT:
1270 1270 raise
1271 1271 dd = 0
1272 1272
1273 1273 try:
1274 1274 f = self.opener(self.indexfile)
1275 1275 f.seek(0, 2)
1276 1276 actual = f.tell()
1277 1277 s = self._io.size
1278 1278 i = max(0, actual / s)
1279 1279 di = actual - (i * s)
1280 1280 if self._inline:
1281 1281 databytes = 0
1282 1282 for r in xrange(self.count()):
1283 1283 databytes += max(0, self.length(r))
1284 1284 dd = 0
1285 1285 di = actual - self.count() * s - databytes
1286 1286 except IOError, inst:
1287 1287 if inst.errno != errno.ENOENT:
1288 1288 raise
1289 1289 di = 0
1290 1290
1291 1291 return (dd, di)
@@ -1,1690 +1,1690 @@ util.py
1 1 """
2 2 util.py - Mercurial utility functions and platform specific implementations
3 3
4 4 Copyright 2005 K. Thananchayan <thananck@yahoo.com>
5 5 Copyright 2005-2007 Matt Mackall <mpm@selenic.com>
6 6 Copyright 2006 Vadim Gelfer <vadim.gelfer@gmail.com>
7 7
8 8 This software may be used and distributed according to the terms
9 9 of the GNU General Public License, incorporated herein by reference.
10 10
11 11 This contains helper routines that are independent of the SCM core and hide
12 12 platform-specific details from the core.
13 13 """
14 14
15 15 from i18n import _
16 16 import cStringIO, errno, getpass, popen2, re, shutil, sys, tempfile, strutil
17 17 import os, stat, threading, time, calendar, ConfigParser, locale, glob, osutil
18 18
19 19 try:
20 20 set = set
21 21 frozenset = frozenset
22 22 except NameError:
23 23 from sets import Set as set, ImmutableSet as frozenset
24 24
25 25 try:
26 26 _encoding = os.environ.get("HGENCODING")
27 27 if sys.platform == 'darwin' and not _encoding:
28 28 # On darwin, getpreferredencoding ignores the locale environment and
29 29 # always returns mac-roman. We override this if the environment is
30 30 # not C (has been customized by the user).
31 31 locale.setlocale(locale.LC_CTYPE, '')
32 32 _encoding = locale.getlocale()[1]
33 33 if not _encoding:
34 34 _encoding = locale.getpreferredencoding() or 'ascii'
35 35 except locale.Error:
36 36 _encoding = 'ascii'
37 37 _encodingmode = os.environ.get("HGENCODINGMODE", "strict")
38 38 _fallbackencoding = 'ISO-8859-1'
39 39
40 40 def tolocal(s):
41 41 """
42 42 Convert a string from internal UTF-8 to local encoding
43 43
44 44 All internal strings should be UTF-8 but some repos before the
45 45 implementation of locale support may contain latin1 or possibly
46 46 other character sets. We attempt to decode everything strictly
47 47 using UTF-8, then Latin-1, and failing that, we use UTF-8 and
48 48 replace unknown characters.
49 49 """
50 50 for e in ('UTF-8', _fallbackencoding):
51 51 try:
52 52 u = s.decode(e) # attempt strict decoding
53 53 return u.encode(_encoding, "replace")
54 54 except LookupError, k:
55 55 raise Abort(_("%s, please check your locale settings") % k)
56 56 except UnicodeDecodeError:
57 57 pass
58 58 u = s.decode("utf-8", "replace") # last ditch
59 59 return u.encode(_encoding, "replace")
60 60
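A small sketch (Python 2; the result depends on the detected _encoding):

    tolocal('caf\xc3\xa9')   # valid UTF-8: decoded strictly, re-encoded locally
    tolocal('caf\xe9')       # Latin-1 bytes: UTF-8 fails, the fallback kicks in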
61 61 def fromlocal(s):
62 62 """
63 63 Convert a string from the local character encoding to UTF-8
64 64
65 65 We attempt to decode strings using the encoding mode set by
66 66 HGENCODINGMODE, which defaults to 'strict'. In this mode, unknown
67 67 characters will cause an error message. Other modes include
68 68 'replace', which replaces unknown characters with a special
69 69 Unicode character, and 'ignore', which drops the character.
70 70 """
71 71 try:
72 72 return s.decode(_encoding, _encodingmode).encode("utf-8")
73 73 except UnicodeDecodeError, inst:
74 74 sub = s[max(0, inst.start-10):inst.start+10]
75 75 raise Abort("decoding near '%s': %s!" % (sub, inst))
76 76 except LookupError, k:
77 77 raise Abort(_("%s, please check your locale settings") % k)
78 78
79 79 def locallen(s):
80 80 """Find the length in characters of a local string"""
81 81 return len(s.decode(_encoding, "replace"))
82 82
83 83 def localsub(s, a, b=None):
84 84 try:
85 85 u = s.decode(_encoding, _encodingmode)
86 86 if b is not None:
87 87 u = u[a:b]
88 88 else:
89 89 u = u[:a]
90 90 return u.encode(_encoding, _encodingmode)
91 91 except UnicodeDecodeError, inst:
92 92 sub = s[max(0, inst.start-10):inst.start+10]
93 93 raise Abort(_("decoding near '%s': %s!") % (sub, inst))
94 94
95 95 # used by parsedate
96 96 defaultdateformats = (
97 97 '%Y-%m-%d %H:%M:%S',
98 98 '%Y-%m-%d %I:%M:%S%p',
99 99 '%Y-%m-%d %H:%M',
100 100 '%Y-%m-%d %I:%M%p',
101 101 '%Y-%m-%d',
102 102 '%m-%d',
103 103 '%m/%d',
104 104 '%m/%d/%y',
105 105 '%m/%d/%Y',
106 106 '%a %b %d %H:%M:%S %Y',
107 107 '%a %b %d %I:%M:%S%p %Y',
108 108 '%a, %d %b %Y %H:%M:%S', # GNU coreutils "/bin/date --rfc-2822"
109 109 '%b %d %H:%M:%S %Y',
110 110 '%b %d %I:%M:%S%p %Y',
111 111 '%b %d %H:%M:%S',
112 112 '%b %d %I:%M:%S%p',
113 113 '%b %d %H:%M',
114 114 '%b %d %I:%M%p',
115 115 '%b %d %Y',
116 116 '%b %d',
117 117 '%H:%M:%S',
118 118 '%I:%M:%S%p',
119 119 '%H:%M',
120 120 '%I:%M%p',
121 121 )
122 122
123 123 extendeddateformats = defaultdateformats + (
124 124 "%Y",
125 125 "%Y-%m",
126 126 "%b",
127 127 "%b %Y",
128 128 )
129 129
130 130 class SignalInterrupt(Exception):
131 131 """Exception raised on SIGTERM and SIGHUP."""
132 132
133 133 # differences from SafeConfigParser:
134 134 # - case-sensitive keys
135 135 # - allows values that are not strings (this means that you may not
136 136 # be able to save the configuration to a file)
137 137 class configparser(ConfigParser.SafeConfigParser):
138 138 def optionxform(self, optionstr):
139 139 return optionstr
140 140
141 141 def set(self, section, option, value):
142 142 return ConfigParser.ConfigParser.set(self, section, option, value)
143 143
144 144 def _interpolate(self, section, option, rawval, vars):
145 145 if not isinstance(rawval, basestring):
146 146 return rawval
147 147 return ConfigParser.SafeConfigParser._interpolate(self, section,
148 148 option, rawval, vars)
149 149
150 150 def cachefunc(func):
151 151 '''cache the result of function calls'''
152 152 # XXX doesn't handle keywords args
153 153 cache = {}
154 154 if func.func_code.co_argcount == 1:
155 155 # we gain a small amount of time because
156 156 # we don't need to pack/unpack the list
157 157 def f(arg):
158 158 if arg not in cache:
159 159 cache[arg] = func(arg)
160 160 return cache[arg]
161 161 else:
162 162 def f(*args):
163 163 if args not in cache:
164 164 cache[args] = func(*args)
165 165 return cache[args]
166 166
167 167 return f
168 168
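A usage sketch (hypothetical function): rebinding the name to the wrapper
makes the recursive calls hit the cache too:

    def fib(n):
        if n < 2:
            return n
        return fib(n - 1) + fib(n - 2)
    fib = cachefunc(fib)
    fib(30)    # 832040; each n is computed once, then served from the cache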
169 169 def pipefilter(s, cmd):
170 170 '''filter string S through command CMD, returning its output'''
171 171 (pin, pout) = os.popen2(cmd, 'b')
172 172 def writer():
173 173 try:
174 174 pin.write(s)
175 175 pin.close()
176 176 except IOError, inst:
177 177 if inst.errno != errno.EPIPE:
178 178 raise
179 179
180 180 # we should use select instead on UNIX, but this will work on most
181 181 # systems, including Windows
182 182 w = threading.Thread(target=writer)
183 183 w.start()
184 184 f = pout.read()
185 185 pout.close()
186 186 w.join()
187 187 return f
188 188
189 189 def tempfilter(s, cmd):
190 190 '''filter string S through a pair of temporary files with CMD.
191 191 CMD is used as a template to create the real command to be run,
192 192 with the strings INFILE and OUTFILE replaced by the real names of
193 193 the temporary files generated.'''
194 194 inname, outname = None, None
195 195 try:
196 196 infd, inname = tempfile.mkstemp(prefix='hg-filter-in-')
197 197 fp = os.fdopen(infd, 'wb')
198 198 fp.write(s)
199 199 fp.close()
200 200 outfd, outname = tempfile.mkstemp(prefix='hg-filter-out-')
201 201 os.close(outfd)
202 202 cmd = cmd.replace('INFILE', inname)
203 203 cmd = cmd.replace('OUTFILE', outname)
204 204 code = os.system(cmd)
205 205 if sys.platform == 'OpenVMS' and code & 1:
206 206 code = 0
207 207 if code: raise Abort(_("command '%s' failed: %s") %
208 208 (cmd, explain_exit(code)))
209 209 return open(outname, 'rb').read()
210 210 finally:
211 211 try:
212 212 if inname: os.unlink(inname)
213 213 except: pass
214 214 try:
215 215 if outname: os.unlink(outname)
216 216 except: pass
217 217
218 218 filtertable = {
219 219 'tempfile:': tempfilter,
220 220 'pipe:': pipefilter,
221 221 }
222 222
223 223 def filter(s, cmd):
224 224 "filter a string through a command that transforms its input to its output"
225 225 for name, fn in filtertable.iteritems():
226 226 if cmd.startswith(name):
227 227 return fn(s, cmd[len(name):].lstrip())
228 228 return pipefilter(s, cmd)
229 229
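# Hypothetical uses of the dispatch above (not part of the original
# source): an explicit prefix picks the mechanism, otherwise a pipe is
# assumed.
#
#     filter(s, 'tempfile: sort INFILE > OUTFILE')   # tempfilter
#     filter(s, 'pipe: wc -l')                       # pipefilter
#     filter(s, 'wc -l')                             # no prefix: pipefilter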
230 230 def binary(s):
231 231 """return true if a string is binary data using diff's heuristic"""
232 232 if s and '\0' in s[:4096]:
233 233 return True
234 234 return False
235 235
236 236 def unique(g):
237 237 """return the unique elements of iterable g"""
238 238 seen = {}
239 239 l = []
240 240 for f in g:
241 241 if f not in seen:
242 242 seen[f] = 1
243 243 l.append(f)
244 244 return l
245 245
246 246 class Abort(Exception):
247 247 """Raised if a command needs to print an error and exit."""
248 248
249 249 class UnexpectedOutput(Abort):
250 250 """Raised to print an error with part of output and exit."""
251 251
252 252 def always(fn): return True
253 253 def never(fn): return False
254 254
255 255 def expand_glob(pats):
256 256 '''On Windows, expand the implicit globs in a list of patterns'''
257 257 if os.name != 'nt':
258 258 return list(pats)
259 259 ret = []
260 260 for p in pats:
261 261 kind, name = patkind(p, None)
262 262 if kind is None:
263 263 globbed = glob.glob(name)
264 264 if globbed:
265 265 ret.extend(globbed)
266 266 continue
267 267 # if we couldn't expand the glob, just keep it around
268 268 ret.append(p)
269 269 return ret
270 270
271 271 def patkind(name, dflt_pat='glob'):
272 272 """Split a string into an optional pattern kind prefix and the
273 273 actual pattern."""
274 274 for prefix in 're', 'glob', 'path', 'relglob', 'relpath', 'relre':
275 275 if name.startswith(prefix + ':'): return name.split(':', 1)
276 276 return dflt_pat, name
277 277
278 278 def globre(pat, head='^', tail='$'):
279 279 "convert a glob pattern into a regexp"
280 280 i, n = 0, len(pat)
281 281 res = ''
282 282 group = False
283 283 def peek(): return i < n and pat[i]
284 284 while i < n:
285 285 c = pat[i]
286 286 i = i+1
287 287 if c == '*':
288 288 if peek() == '*':
289 289 i += 1
290 290 res += '.*'
291 291 else:
292 292 res += '[^/]*'
293 293 elif c == '?':
294 294 res += '.'
295 295 elif c == '[':
296 296 j = i
297 297 if j < n and pat[j] in '!]':
298 298 j += 1
299 299 while j < n and pat[j] != ']':
300 300 j += 1
301 301 if j >= n:
302 302 res += '\\['
303 303 else:
304 304 stuff = pat[i:j].replace('\\','\\\\')
305 305 i = j + 1
306 306 if stuff[0] == '!':
307 307 stuff = '^' + stuff[1:]
308 308 elif stuff[0] == '^':
309 309 stuff = '\\' + stuff
310 310 res = '%s[%s]' % (res, stuff)
311 311 elif c == '{':
312 312 group = True
313 313 res += '(?:'
314 314 elif c == '}' and group:
315 315 res += ')'
316 316 group = False
317 317 elif c == ',' and group:
318 318 res += '|'
319 319 elif c == '\\':
320 320 p = peek()
321 321 if p:
322 322 i += 1
323 323 res += re.escape(p)
324 324 else:
325 325 res += re.escape(c)
326 326 else:
327 327 res += re.escape(c)
328 328 return head + res + tail
329 329
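# Worked examples of the glob -> regexp translation above (illustrative,
# not part of the original module):
#
#     globre('*.py')     # -> r'^[^/]*\.py$'   '*' does not cross '/'
#     globre('**')       # -> r'^.*$'          '**' matches across '/'
#     globre('{a,b}c')   # -> r'^(?:a|b)c$'    braces become alternation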
330 330 _globchars = {'[': 1, '{': 1, '*': 1, '?': 1}
331 331
332 332 def pathto(root, n1, n2):
333 333 '''return the relative path from one place to another.
334 334 root should use os.sep to separate directories
335 335 n1 should use os.sep to separate directories
336 336 n2 should use "/" to separate directories
337 337 returns an os.sep-separated path.
338 338
339 339 If n1 is a relative path, it is assumed to be
340 340 relative to root.
341 341 n2 should always be relative to root.
342 342 '''
343 343 if not n1: return localpath(n2)
344 344 if os.path.isabs(n1):
345 345 if os.path.splitdrive(root)[0] != os.path.splitdrive(n1)[0]:
346 346 return os.path.join(root, localpath(n2))
347 347 n2 = '/'.join((pconvert(root), n2))
348 348 a, b = n1.split(os.sep), n2.split('/')
349 349 a.reverse()
350 350 b.reverse()
351 351 while a and b and a[-1] == b[-1]:
352 352 a.pop()
353 353 b.pop()
354 354 b.reverse()
355 355 return os.sep.join((['..'] * len(a)) + b)
356 356
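# A small worked example for pathto (illustrative, assuming a POSIX
# os.sep of '/'):
#
#     pathto('/repo', 'a/b', 'a/c')   # -> '../c'
#
# The shared leading components are popped off both paths; each leftover
# component of n1 then contributes one '..'.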
357 357 def canonpath(root, cwd, myname):
358 358 """return the canonical path of myname, given cwd and root"""
359 359 if root == os.sep:
360 360 rootsep = os.sep
361 361 elif root.endswith(os.sep):
362 362 rootsep = root
363 363 else:
364 364 rootsep = root + os.sep
365 365 name = myname
366 366 if not os.path.isabs(name):
367 367 name = os.path.join(root, cwd, name)
368 368 name = os.path.normpath(name)
369 369 audit_path = path_auditor(root)
370 370 if name != rootsep and name.startswith(rootsep):
371 371 name = name[len(rootsep):]
372 372 audit_path(name)
373 373 return pconvert(name)
374 374 elif name == root:
375 375 return ''
376 376 else:
377 377 # Determine whether `name' is in the hierarchy at or beneath `root',
378 378 # by iterating name=dirname(name) until that causes no change (can't
379 379 # check name == '/', because that doesn't work on windows). For each
380 380 # `name', compare dev/inode numbers. If they match, the list `rel'
381 381 # holds the reversed list of components making up the relative file
382 382 # name we want.
383 383 root_st = os.stat(root)
384 384 rel = []
385 385 while True:
386 386 try:
387 387 name_st = os.stat(name)
388 388 except OSError:
389 389 break
390 390 if samestat(name_st, root_st):
391 391 if not rel:
392 392 # name was actually the same as root (maybe a symlink)
393 393 return ''
394 394 rel.reverse()
395 395 name = os.path.join(*rel)
396 396 audit_path(name)
397 397 return pconvert(name)
398 398 dirname, basename = os.path.split(name)
399 399 rel.append(basename)
400 400 if dirname == name:
401 401 break
402 402 name = dirname
403 403
404 404 raise Abort('%s not under root' % myname)
405 405
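# Illustrative calls (hypothetical paths, assuming a POSIX system where
# /repo exists):
#
#     canonpath('/repo', '', '/repo/a/b')    # -> 'a/b'
#     canonpath('/repo', 'a', 'b')           # -> 'a/b' (cwd-relative name)
#     canonpath('/repo', '', '/elsewhere')   # raises Abort: not under root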
406 406 def matcher(canonroot, cwd='', names=[], inc=[], exc=[], src=None):
407 407 return _matcher(canonroot, cwd, names, inc, exc, 'glob', src)
408 408
409 409 def cmdmatcher(canonroot, cwd='', names=[], inc=[], exc=[], src=None,
410 410 globbed=False, default=None):
411 411 default = default or 'relpath'
412 412 if default == 'relpath' and not globbed:
413 413 names = expand_glob(names)
414 414 return _matcher(canonroot, cwd, names, inc, exc, default, src)
415 415
416 416 def _matcher(canonroot, cwd, names, inc, exc, dflt_pat, src):
417 417 """build a function to match a set of file patterns
418 418
419 419 arguments:
420 420 canonroot - the canonical root of the tree you're matching against
421 421 cwd - the current working directory, if relevant
422 422 names - patterns to find
423 423 inc - patterns to include
424 424 exc - patterns to exclude
425 425 dflt_pat - if a pattern in names has no explicit type, assume this one
426 426 src - where these patterns came from (e.g. .hgignore)
427 427
428 428 a pattern is one of:
429 429 'glob:<glob>' - a glob relative to cwd
430 430 're:<regexp>' - a regular expression
431 431 'path:<path>' - a path relative to canonroot
432 432 'relglob:<glob>' - an unrooted glob (*.c matches C files in all dirs)
433 433 'relpath:<path>' - a path relative to cwd
434 434 'relre:<regexp>' - a regexp that doesn't have to match the start of a name
435 435 '<something>' - one of the cases above, selected by the dflt_pat argument
436 436
437 437 returns:
438 438 a 3-tuple containing
439 439 - list of roots (places where one should start a recursive walk of the fs);
440 440 this often matches the explicit non-pattern names passed in, but also
441 441 includes the initial part of glob: patterns that has no glob characters
442 442 - a bool match(filename) function
443 443 - a bool indicating if any patterns were passed in
444 444 """
445 445
446 446 # a common case: no patterns at all
447 447 if not names and not inc and not exc:
448 448 return [], always, False
449 449
450 450 def contains_glob(name):
451 451 for c in name:
452 452 if c in _globchars: return True
453 453 return False
454 454
455 455 def regex(kind, name, tail):
456 456 '''convert a pattern into a regular expression'''
457 457 if not name:
458 458 return ''
459 459 if kind == 're':
460 460 return name
461 461 elif kind == 'path':
462 462 return '^' + re.escape(name) + '(?:/|$)'
463 463 elif kind == 'relglob':
464 464 return globre(name, '(?:|.*/)', tail)
465 465 elif kind == 'relpath':
466 466 return re.escape(name) + '(?:/|$)'
467 467 elif kind == 'relre':
468 468 if name.startswith('^'):
469 469 return name
470 470 return '.*' + name
471 471 return globre(name, '', tail)
472 472
473 473 def matchfn(pats, tail):
474 474 """build a matching function from a set of patterns"""
475 475 if not pats:
476 476 return
477 477 try:
478 478 pat = '(?:%s)' % '|'.join([regex(k, p, tail) for (k, p) in pats])
479 479 return re.compile(pat).match
480 480 except OverflowError:
481 481 # We're using a Python with a tiny regex engine and we
482 482 # made it explode, so we'll divide the pattern list in two
483 483 # until it works
484 484 l = len(pats)
485 485 if l < 2:
486 486 raise
487 487 a, b = matchfn(pats[:l/2], tail), matchfn(pats[l/2:], tail)
488 488 return lambda s: a(s) or b(s)
489 489 except re.error:
490 490 for k, p in pats:
491 491 try:
492 492 re.compile('(?:%s)' % regex(k, p, tail))
493 493 except re.error:
494 494 if src:
495 495 raise Abort("%s: invalid pattern (%s): %s" %
496 496 (src, k, p))
497 497 else:
498 498 raise Abort("invalid pattern (%s): %s" % (k, p))
499 499 raise Abort("invalid pattern")
500 500
501 501 def globprefix(pat):
502 502 '''return the non-glob prefix of a path, e.g. foo/* -> foo'''
503 503 root = []
504 504 for p in pat.split('/'):
505 505 if contains_glob(p): break
506 506 root.append(p)
507 507 return '/'.join(root) or '.'
508 508
509 509 def normalizepats(names, default):
510 510 pats = []
511 511 roots = []
512 512 anypats = False
513 513 for kind, name in [patkind(p, default) for p in names]:
514 514 if kind in ('glob', 'relpath'):
515 515 name = canonpath(canonroot, cwd, name)
516 516 elif kind in ('relglob', 'path'):
517 517 name = normpath(name)
518 518
519 519 pats.append((kind, name))
520 520
521 521 if kind in ('glob', 're', 'relglob', 'relre'):
522 522 anypats = True
523 523
524 524 if kind == 'glob':
525 525 root = globprefix(name)
526 526 roots.append(root)
527 527 elif kind in ('relpath', 'path'):
528 528 roots.append(name or '.')
529 529 elif kind == 'relglob':
530 530 roots.append('.')
531 531 return roots, pats, anypats
532 532
533 533 roots, pats, anypats = normalizepats(names, dflt_pat)
534 534
535 535 patmatch = matchfn(pats, '$') or always
536 536 incmatch = always
537 537 if inc:
538 538 dummy, inckinds, dummy = normalizepats(inc, 'glob')
539 539 incmatch = matchfn(inckinds, '(?:/|$)')
540 540 excmatch = lambda fn: False
541 541 if exc:
542 542 dummy, exckinds, dummy = normalizepats(exc, 'glob')
543 543 excmatch = matchfn(exckinds, '(?:/|$)')
544 544
545 545 if not names and inc and not exc:
546 546 # common case: hgignore patterns
547 547 match = incmatch
548 548 else:
549 549 match = lambda fn: incmatch(fn) and not excmatch(fn) and patmatch(fn)
550 550
551 551 return (roots, match, (inc or exc or anypats) and True)
552 552
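# A hypothetical use of the matcher machinery above (sketch, not part of
# the original module):
#
#     roots, match, anypats = matcher('/repo', names=['glob:src/*.py'])
#     # roots   -> ['src']   non-glob prefix, seeds the filesystem walk
#     # match('src/a.py')    -> truthy; match('doc/a.py') -> falsy
#     # anypats -> True      a glob pattern was supplied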
553 553 _hgexecutable = None
554 554
555 555 def hgexecutable():
556 556 """return location of the 'hg' executable.
557 557
558 558 Defaults to $HG or 'hg' in the search path.
559 559 """
560 560 if _hgexecutable is None:
561 561 set_hgexecutable(os.environ.get('HG') or find_exe('hg', 'hg'))
562 562 return _hgexecutable
563 563
564 564 def set_hgexecutable(path):
565 565 """set location of the 'hg' executable"""
566 566 global _hgexecutable
567 567 _hgexecutable = path
568 568
569 569 def system(cmd, environ={}, cwd=None, onerr=None, errprefix=None):
570 570 '''enhanced shell command execution.
571 571 run with environment maybe modified, maybe in different dir.
572 572
573 573 if command fails and onerr is None, return status. if onerr is a
574 574 ui object, print error message and return status; else raise onerr
575 575 as an exception.'''
576 576 def py2shell(val):
577 577 'convert python object into string that is useful to shell'
578 578 if val in (None, False):
579 579 return '0'
580 580 if val == True:
581 581 return '1'
582 582 return str(val)
583 583 oldenv = {}
584 584 for k in environ:
585 585 oldenv[k] = os.environ.get(k)
586 586 if cwd is not None:
587 587 oldcwd = os.getcwd()
588 588 origcmd = cmd
589 589 if os.name == 'nt':
590 590 cmd = '"%s"' % cmd
591 591 try:
592 592 for k, v in environ.iteritems():
593 593 os.environ[k] = py2shell(v)
594 594 os.environ['HG'] = hgexecutable()
595 595 if cwd is not None and oldcwd != cwd:
596 596 os.chdir(cwd)
597 597 rc = os.system(cmd)
598 598 if sys.platform == 'OpenVMS' and rc & 1:
599 599 rc = 0
600 600 if rc and onerr:
601 601 errmsg = '%s %s' % (os.path.basename(origcmd.split(None, 1)[0]),
602 602 explain_exit(rc)[0])
603 603 if errprefix:
604 604 errmsg = '%s: %s' % (errprefix, errmsg)
605 605 try:
606 606 onerr.warn(errmsg + '\n')
607 607 except AttributeError:
608 608 raise onerr(errmsg)
609 609 return rc
610 610 finally:
611 611 for k, v in oldenv.iteritems():
612 612 if v is None:
613 613 del os.environ[k]
614 614 else:
615 615 os.environ[k] = v
616 616 if cwd is not None and oldcwd != cwd:
617 617 os.chdir(oldcwd)
618 618
619 619 # os.path.lexists is not available on python2.3
620 620 def lexists(filename):
621 621 "test whether a file with this name exists. does not follow symlinks"
622 622 try:
623 623 os.lstat(filename)
624 624 except:
625 625 return False
626 626 return True
627 627
628 628 def rename(src, dst):
629 629 """forcibly rename a file"""
630 630 try:
631 631 os.rename(src, dst)
632 632 except OSError, err: # FIXME: check err (EEXIST ?)
633 633 # on windows, rename to existing file is not allowed, so we
634 634 # must delete destination first. but if file is open, unlink
635 635 # schedules it for delete but does not delete it. rename
636 636 # happens immediately even for open files, so we create
637 637 # temporary file, delete it, rename destination to that name,
638 638 # then delete that. then rename is safe to do.
639 639 fd, temp = tempfile.mkstemp(dir=os.path.dirname(dst) or '.')
640 640 os.close(fd)
641 641 os.unlink(temp)
642 642 os.rename(dst, temp)
643 643 os.unlink(temp)
644 644 os.rename(src, dst)
645 645
646 646 def unlink(f):
647 647 """unlink and remove the directory if it is empty"""
648 648 os.unlink(f)
649 649 # try removing directories that might now be empty
650 650 try:
651 651 os.removedirs(os.path.dirname(f))
652 652 except OSError:
653 653 pass
654 654
655 655 def copyfile(src, dest):
656 656 "copy a file, preserving mode"
657 657 if os.path.islink(src):
658 658 try:
659 659 os.unlink(dest)
660 660 except:
661 661 pass
662 662 os.symlink(os.readlink(src), dest)
663 663 else:
664 664 try:
665 665 shutil.copyfile(src, dest)
666 666 shutil.copymode(src, dest)
667 667 except shutil.Error, inst:
668 668 raise Abort(str(inst))
669 669
670 670 def copyfiles(src, dst, hardlink=None):
671 671 """Copy a directory tree using hardlinks if possible"""
672 672
673 673 if hardlink is None:
674 674 hardlink = (os.stat(src).st_dev ==
675 675 os.stat(os.path.dirname(dst)).st_dev)
676 676
677 677 if os.path.isdir(src):
678 678 os.mkdir(dst)
679 679 for name, kind in osutil.listdir(src):
680 680 srcname = os.path.join(src, name)
681 681 dstname = os.path.join(dst, name)
682 682 copyfiles(srcname, dstname, hardlink)
683 683 else:
684 684 if hardlink:
685 685 try:
686 686 os_link(src, dst)
687 687 except (IOError, OSError):
688 688 hardlink = False
689 689 shutil.copy(src, dst)
690 690 else:
691 691 shutil.copy(src, dst)
692 692
693 693 class path_auditor(object):
694 694 '''ensure that a filesystem path contains no banned components.
695 695 the following properties of a path are checked:
696 696
697 697 - under top-level .hg
698 698 - starts at the root of a windows drive
699 699 - contains ".."
700 700 - traverses a symlink (e.g. a/symlink_here/b)
701 701 - inside a nested repository'''
702 702
703 703 def __init__(self, root):
704 704 self.audited = set()
705 705 self.auditeddir = set()
706 706 self.root = root
707 707
708 708 def __call__(self, path):
709 709 if path in self.audited:
710 710 return
711 711 normpath = os.path.normcase(path)
712 712 parts = normpath.split(os.sep)
713 713 if (os.path.splitdrive(path)[0] or parts[0] in ('.hg', '')
714 714 or os.pardir in parts):
715 715 raise Abort(_("path contains illegal component: %s") % path)
716 716 def check(prefix):
717 717 curpath = os.path.join(self.root, prefix)
718 718 try:
719 719 st = os.lstat(curpath)
720 720 except OSError, err:
721 721 # EINVAL can be raised for invalid path syntax under win32; such
722 722 # errors must be ignored, since patterns are checked this way too.
723 723 if err.errno not in (errno.ENOENT, errno.EINVAL):
724 724 raise
725 725 else:
726 726 if stat.S_ISLNK(st.st_mode):
727 727 raise Abort(_('path %r traverses symbolic link %r') %
728 728 (path, prefix))
729 729 elif (stat.S_ISDIR(st.st_mode) and
730 730 os.path.isdir(os.path.join(curpath, '.hg'))):
731 731 raise Abort(_('path %r is inside repo %r') %
732 732 (path, prefix))
733 733
734 734 prefixes = []
735 735 for c in strutil.rfindall(normpath, os.sep):
736 736 prefix = normpath[:c]
737 737 if prefix in self.auditeddir:
738 738 break
739 739 check(prefix)
740 740 prefixes.append(prefix)
741 741
742 742 self.audited.add(path)
743 743 # only add prefixes to the cache after checking everything: we don't
744 744 # want to add "foo/bar/baz" before checking if there's a "foo/.hg"
745 745 self.auditeddir.update(prefixes)
746 746
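# Illustrative behavior (hypothetical repo root, not in the original
# source):
#
#     audit = path_auditor('/repo')
#     audit('src/a.py')   # passes; cached in audit.audited
#     audit('.hg/hgrc')   # raises Abort: under the top-level .hg
#     audit('a/../b')     # raises Abort: contains '..'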
747 747 def _makelock_file(info, pathname):
748 748 ld = os.open(pathname, os.O_CREAT | os.O_WRONLY | os.O_EXCL)
749 749 os.write(ld, info)
750 750 os.close(ld)
751 751
752 752 def _readlock_file(pathname):
753 753 return posixfile(pathname).read()
754 754
755 755 def nlinks(pathname):
756 756 """Return number of hardlinks for the given file."""
757 757 return os.lstat(pathname).st_nlink
758 758
759 759 if hasattr(os, 'link'):
760 760 os_link = os.link
761 761 else:
762 762 def os_link(src, dst):
763 763 raise OSError(0, _("Hardlinks not supported"))
764 764
765 765 def fstat(fp):
766 766 '''stat file object that may not have fileno method.'''
767 767 try:
768 768 return os.fstat(fp.fileno())
769 769 except AttributeError:
770 770 return os.stat(fp.name)
771 771
772 772 posixfile = file
773 773
774 774 def is_win_9x():
775 775 '''return true if run on windows 95, 98 or me.'''
776 776 try:
777 777 return sys.getwindowsversion()[3] == 1
778 778 except AttributeError:
779 779 return os.name == 'nt' and 'command' in os.environ.get('comspec', '')
780 780
781 781 getuser_fallback = None
782 782
783 783 def getuser():
784 784 '''return name of current user'''
785 785 try:
786 786 return getpass.getuser()
787 787 except ImportError:
788 788 # import of pwd will fail on windows - try fallback
789 789 if getuser_fallback:
790 790 return getuser_fallback()
791 791 # raised if win32api not available
792 792 raise Abort(_('user name not available - set USERNAME '
793 793 'environment variable'))
794 794
795 795 def username(uid=None):
796 796 """Return the name of the user with the given uid.
797 797
798 798 If uid is None, return the name of the current user."""
799 799 try:
800 800 import pwd
801 801 if uid is None:
802 802 uid = os.getuid()
803 803 try:
804 804 return pwd.getpwuid(uid)[0]
805 805 except KeyError:
806 806 return str(uid)
807 807 except ImportError:
808 808 return None
809 809
810 810 def groupname(gid=None):
811 811 """Return the name of the group with the given gid.
812 812
813 813 If gid is None, return the name of the current group."""
814 814 try:
815 815 import grp
816 816 if gid is None:
817 817 gid = os.getgid()
818 818 try:
819 819 return grp.getgrgid(gid)[0]
820 820 except KeyError:
821 821 return str(gid)
822 822 except ImportError:
823 823 return None
824 824
825 825 # File system features
826 826
827 827 def checkfolding(path):
828 828 """
829 829 Check whether the given path is on a case-sensitive filesystem
830 830
831 831 Requires a path (like /foo/.hg) ending with a foldable final
832 832 directory component.
833 833 """
834 834 s1 = os.stat(path)
835 835 d, b = os.path.split(path)
836 836 p2 = os.path.join(d, b.upper())
837 837 if path == p2:
838 838 p2 = os.path.join(d, b.lower())
839 839 try:
840 840 s2 = os.stat(p2)
841 841 if s2 == s1:
842 842 return False
843 843 return True
844 844 except:
845 845 return True
846 846
847 847 def checkexec(path):
848 848 """
849 849 Check whether the given path is on a filesystem with UNIX-like exec flags
850 850
851 851 Requires a directory (like /foo/.hg)
852 852 """
853 853 try:
854 854 EXECFLAGS = stat.S_IXUSR | stat.S_IXGRP | stat.S_IXOTH
855 855 fh, fn = tempfile.mkstemp("", "", path)
856 856 os.close(fh)
857 857 m = os.stat(fn).st_mode
858 858 # VFAT on Linux can flip the mode but does not persist it across a
859 859 # FS remount; often detectable because new files get the exec bit on.
860 860 new_file_has_exec = m & EXECFLAGS
861 861 os.chmod(fn, m ^ EXECFLAGS)
862 862 exec_flags_cannot_flip = (os.stat(fn).st_mode == m)
863 863 os.unlink(fn)
864 864 except (IOError,OSError):
865 865 # we don't care, the user probably won't be able to commit anyway
866 866 return False
867 867 return not (new_file_has_exec or exec_flags_cannot_flip)
868 868
869 869 def execfunc(path, fallback):
870 870 '''return an is_exec() function with default to fallback'''
871 871 if checkexec(path):
872 872 return lambda x: is_exec(os.path.join(path, x))
873 873 return fallback
874 874
875 875 def checklink(path):
876 876 """check whether the given path is on a symlink-capable filesystem"""
877 877 # mktemp is not racy because symlink creation will fail if the
878 878 # file already exists
879 879 name = tempfile.mktemp(dir=path)
880 880 try:
881 881 os.symlink(".", name)
882 882 os.unlink(name)
883 883 return True
884 884 except (OSError, AttributeError):
885 885 return False
886 886
887 887 def linkfunc(path, fallback):
888 888 '''return an is_link() function with default to fallback'''
889 889 if checklink(path):
890 890 return lambda x: os.path.islink(os.path.join(path, x))
891 891 return fallback
892 892
893 893 _umask = os.umask(0)
894 894 os.umask(_umask)
895 895
896 896 def needbinarypatch():
897 897 """return True if patches should be applied in binary mode by default."""
898 898 return os.name == 'nt'
899 899
900 900 # Platform specific variants
901 901 if os.name == 'nt':
902 902 import msvcrt
903 903 nulldev = 'NUL:'
904 904
905 905 class winstdout:
906 906 '''stdout on windows misbehaves if sent through a pipe'''
907 907
908 908 def __init__(self, fp):
909 909 self.fp = fp
910 910
911 911 def __getattr__(self, key):
912 912 return getattr(self.fp, key)
913 913
914 914 def close(self):
915 915 try:
916 916 self.fp.close()
917 917 except: pass
918 918
919 919 def write(self, s):
920 920 try:
921 921 return self.fp.write(s)
922 922 except IOError, inst:
923 923 if inst.errno != 0: raise
924 924 self.close()
925 925 raise IOError(errno.EPIPE, 'Broken pipe')
926 926
927 927 def flush(self):
928 928 try:
929 929 return self.fp.flush()
930 930 except IOError, inst:
931 931 if inst.errno != errno.EINVAL: raise
932 932 self.close()
933 933 raise IOError(errno.EPIPE, 'Broken pipe')
934 934
935 935 sys.stdout = winstdout(sys.stdout)
936 936
937 937 def system_rcpath():
938 938 try:
939 939 return system_rcpath_win32()
940 940 except:
941 941 return [r'c:\mercurial\mercurial.ini']
942 942
943 943 def user_rcpath():
944 944 '''return os-specific hgrc search path to the user dir'''
945 945 try:
946 946 userrc = user_rcpath_win32()
947 947 except:
948 948 userrc = os.path.join(os.path.expanduser('~'), 'mercurial.ini')
949 949 path = [userrc]
950 950 userprofile = os.environ.get('USERPROFILE')
951 951 if userprofile:
952 952 path.append(os.path.join(userprofile, 'mercurial.ini'))
953 953 return path
954 954
955 955 def parse_patch_output(output_line):
956 956 """parses the output produced by patch and returns the file name"""
957 957 pf = output_line[14:]
958 958 if pf[0] == '`':
959 959 pf = pf[1:-1] # Remove the quotes
960 960 return pf
961 961
962 962 def testpid(pid):
963 963 '''return False if pid dead, True if running or not known'''
964 964 return True
965 965
966 966 def set_exec(f, mode):
967 967 pass
968 968
969 969 def set_link(f, mode):
970 970 pass
971 971
972 972 def set_binary(fd):
973 973 msvcrt.setmode(fd.fileno(), os.O_BINARY)
974 974
975 975 def pconvert(path):
976 976 return path.replace("\\", "/")
977 977
978 978 def localpath(path):
979 979 return path.replace('/', '\\')
980 980
981 981 def normpath(path):
982 982 return pconvert(os.path.normpath(path))
983 983
984 984 makelock = _makelock_file
985 985 readlock = _readlock_file
986 986
987 987 def samestat(s1, s2):
988 988 return False
989 989
990 990 # A sequence of backslashes is special iff it precedes a double quote:
991 991 # - if there's an even number of backslashes, the double quote is not
992 992 # quoted (i.e. it ends the quoted region)
993 993 # - if there's an odd number of backslashes, the double quote is quoted
994 994 # - in both cases, every pair of backslashes is unquoted into a single
995 995 # backslash
996 996 # (See http://msdn2.microsoft.com/en-us/library/a1y7w461.aspx )
997 997 # So, to quote a string, we must surround it in double quotes, double
998 998 # the number of backslashes that precede double quotes and add another
999 999 # backslash before every double quote (being careful with the double
1000 1000 # quote we've appended to the end)
1001 1001 _quotere = None
1002 1002 def shellquote(s):
1003 1003 global _quotere
1004 1004 if _quotere is None:
1005 1005 _quotere = re.compile(r'(\\*)("|\\$)')
1006 1006 return '"%s"' % _quotere.sub(r'\1\1\\\2', s)
1007 1007
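# Hedged examples of the quoting rules described above (illustrative,
# not part of the original source):
#
#     shellquote('foo bar')   # -> "foo bar"  (just wrapped in quotes)
#     shellquote('a"b')       # -> "a\"b"     (embedded quote is escaped,
#                             #    per the backslash rules above)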
1008 1008 def quotecommand(cmd):
1009 1009 """Build a command string suitable for os.popen* calls."""
1010 1010 # The extra quotes are needed because popen* runs the command
1011 1011 # through the current COMSPEC. cmd.exe suppresses enclosing quotes.
1012 1012 return '"' + cmd + '"'
1013 1013
1014 1014 def explain_exit(code):
1015 1015 return _("exited with status %d") % code, code
1016 1016
1017 1017 # if you change this stub into a real check, please try to implement the
1018 1018 # username and groupname functions above, too.
1019 1019 def isowner(fp, st=None):
1020 1020 return True
1021 1021
1022 1022 def find_in_path(name, path, default=None):
1023 1023 '''find name in search path. path can be string (will be split
1024 1024 with os.pathsep), or iterable thing that returns strings. if name
1025 1025 found, return path to name. else return default. name is looked up
1026 1026 using cmd.exe rules, using PATHEXT.'''
1027 1027 if isinstance(path, str):
1028 1028 path = path.split(os.pathsep)
1029 1029
1030 1030 pathext = os.environ.get('PATHEXT', '.COM;.EXE;.BAT;.CMD')
1031 1031 pathext = pathext.lower().split(os.pathsep)
1032 1032 isexec = os.path.splitext(name)[1].lower() in pathext
1033 1033
1034 1034 for p in path:
1035 1035 p_name = os.path.join(p, name)
1036 1036
1037 1037 if isexec and os.path.exists(p_name):
1038 1038 return p_name
1039 1039
1040 1040 for ext in pathext:
1041 1041 p_name_ext = p_name + ext
1042 1042 if os.path.exists(p_name_ext):
1043 1043 return p_name_ext
1044 1044 return default
1045 1045
1046 1046 def set_signal_handler():
1047 1047 try:
1048 1048 set_signal_handler_win32()
1049 1049 except NameError:
1050 1050 pass
1051 1051
1052 1052 try:
1053 1053 # override functions with win32 versions if possible
1054 1054 from util_win32 import *
1055 1055 if not is_win_9x():
1056 1056 posixfile = posixfile_nt
1057 1057 except ImportError:
1058 1058 pass
1059 1059
1060 1060 else:
1061 1061 nulldev = '/dev/null'
1062 1062
1063 1063 def rcfiles(path):
1064 1064 rcs = [os.path.join(path, 'hgrc')]
1065 1065 rcdir = os.path.join(path, 'hgrc.d')
1066 1066 try:
1067 1067 rcs.extend([os.path.join(rcdir, f)
1068 1068 for f, kind in osutil.listdir(rcdir)
1069 1069 if f.endswith(".rc")])
1070 1070 except OSError:
1071 1071 pass
1072 1072 return rcs
1073 1073
1074 1074 def system_rcpath():
1075 1075 path = []
1076 1076 # old mod_python does not set sys.argv
1077 1077 if len(getattr(sys, 'argv', [])) > 0:
1078 1078 path.extend(rcfiles(os.path.dirname(sys.argv[0]) +
1079 1079 '/../etc/mercurial'))
1080 1080 path.extend(rcfiles('/etc/mercurial'))
1081 1081 return path
1082 1082
1083 1083 def user_rcpath():
1084 1084 return [os.path.expanduser('~/.hgrc')]
1085 1085
1086 1086 def parse_patch_output(output_line):
1087 1087 """parses the output produced by patch and returns the file name"""
1088 1088 pf = output_line[14:]
1089 1089 if os.sys.platform == 'OpenVMS':
1090 1090 if pf[0] == '`':
1091 1091 pf = pf[1:-1] # Remove the quotes
1092 1092 else:
1093 1093 if pf.startswith("'") and pf.endswith("'") and " " in pf:
1094 1094 pf = pf[1:-1] # Remove the quotes
1095 1095 return pf
1096 1096
1097 1097 def is_exec(f):
1098 1098 """check whether a file is executable"""
1099 1099 return (os.lstat(f).st_mode & 0100 != 0)
1100 1100
1101 1101 def set_exec(f, mode):
1102 1102 s = os.lstat(f).st_mode
1103 1103 if stat.S_ISLNK(s) or (s & 0100 != 0) == mode:
1104 1104 return
1105 1105 if mode:
1106 1106 # Turn on +x for every +r bit when making a file executable
1107 1107 # and obey umask.
1108 1108 os.chmod(f, s | (s & 0444) >> 2 & ~_umask)
1109 1109 else:
1110 1110 os.chmod(f, s & 0666)
1111 1111
1112 1112 def set_link(f, mode):
1113 1113 """make a file a symbolic link/regular file
1114 1114
1115 1115 if a file is changed to a link, its contents become the link data;
1116 1116 if a link is changed to a file, its link data becomes its contents
1117 1117 """
1118 1118
1119 1119 m = os.path.islink(f)
1120 1120 if m == bool(mode):
1121 1121 return
1122 1122
1123 1123 if mode: # switch file to link
1124 1124 data = file(f).read()
1125 1125 os.unlink(f)
1126 1126 os.symlink(data, f)
1127 1127 else:
1128 1128 data = os.readlink(f)
1129 1129 os.unlink(f)
1130 1130 file(f, "w").write(data)
1131 1131
1132 1132 def set_binary(fd):
1133 1133 pass
1134 1134
1135 1135 def pconvert(path):
1136 1136 return path
1137 1137
1138 1138 def localpath(path):
1139 1139 return path
1140 1140
1141 1141 normpath = os.path.normpath
1142 1142 samestat = os.path.samestat
1143 1143
1144 1144 def makelock(info, pathname):
1145 1145 try:
1146 1146 os.symlink(info, pathname)
1147 1147 except OSError, why:
1148 1148 if why.errno == errno.EEXIST:
1149 1149 raise
1150 1150 else:
1151 1151 _makelock_file(info, pathname)
1152 1152
1153 1153 def readlock(pathname):
1154 1154 try:
1155 1155 return os.readlink(pathname)
1156 1156 except OSError, why:
1157 1157 if why.errno in (errno.EINVAL, errno.ENOSYS):
1158 1158 return _readlock_file(pathname)
1159 1159 else:
1160 1160 raise
1161 1161
1162 1162 def shellquote(s):
1163 1163 if os.sys.platform == 'OpenVMS':
1164 1164 return '"%s"' % s
1165 1165 else:
1166 1166 return "'%s'" % s.replace("'", "'\\''")
1167 1167
1168 1168 def quotecommand(cmd):
1169 1169 return cmd
1170 1170
1171 1171 def testpid(pid):
1172 1172 '''return False if pid dead, True if running or not sure'''
1173 1173 if os.sys.platform == 'OpenVMS':
1174 1174 return True
1175 1175 try:
1176 1176 os.kill(pid, 0)
1177 1177 return True
1178 1178 except OSError, inst:
1179 1179 return inst.errno != errno.ESRCH
1180 1180
1181 1181 def explain_exit(code):
1182 1182 """return a 2-tuple (desc, code) describing a process's status"""
1183 1183 if os.WIFEXITED(code):
1184 1184 val = os.WEXITSTATUS(code)
1185 1185 return _("exited with status %d") % val, val
1186 1186 elif os.WIFSIGNALED(code):
1187 1187 val = os.WTERMSIG(code)
1188 1188 return _("killed by signal %d") % val, val
1189 1189 elif os.WIFSTOPPED(code):
1190 1190 val = os.WSTOPSIG(code)
1191 1191 return _("stopped by signal %d") % val, val
1192 1192 raise ValueError(_("invalid exit code"))
1193 1193
1194 1194 def isowner(fp, st=None):
1195 1195 """Return True if the file object fp belongs to the current user.
1196 1196
1197 1197 The return value of util.fstat(fp) may be passed as the st argument.
1198 1198 """
1199 1199 if st is None:
1200 1200 st = fstat(fp)
1201 1201 return st.st_uid == os.getuid()
1202 1202
1203 1203 def find_in_path(name, path, default=None):
1204 1204 '''find name in search path. path can be string (will be split
1205 1205 with os.pathsep), or iterable thing that returns strings. if name
1206 1206 found, return path to name. else return default.'''
1207 1207 if isinstance(path, str):
1208 1208 path = path.split(os.pathsep)
1209 1209 for p in path:
1210 1210 p_name = os.path.join(p, name)
1211 1211 if os.path.exists(p_name):
1212 1212 return p_name
1213 1213 return default
1214 1214
1215 1215 def set_signal_handler():
1216 1216 pass
1217 1217
1218 1218 def find_exe(name, default=None):
1219 1219 '''find path of an executable.
1220 1220 if name contains a path component, return it as is. otherwise,
1221 1221 use normal executable search path.'''
1222 1222
1223 1223 if os.sep in name or sys.platform == 'OpenVMS':
1224 1224 # don't check the executable bit. if the file isn't
1225 1225 # executable, whoever tries to actually run it will give a
1226 1226 # much more useful error message.
1227 1227 return name
1228 1228 return find_in_path(name, os.environ.get('PATH', ''), default=default)
1229 1229
1230 1230 def _buildencodefun():
1231 1231 e = '_'
1232 1232 win_reserved = [ord(x) for x in '\\:*?"<>|']
1233 1233 cmap = dict([ (chr(x), chr(x)) for x in xrange(127) ])
1234 1234 for x in (range(32) + range(126, 256) + win_reserved):
1235 1235 cmap[chr(x)] = "~%02x" % x
1236 1236 for x in range(ord("A"), ord("Z")+1) + [ord(e)]:
1237 1237 cmap[chr(x)] = e + chr(x).lower()
1238 1238 dmap = {}
1239 1239 for k, v in cmap.iteritems():
1240 1240 dmap[v] = k
1241 1241 def decode(s):
1242 1242 i = 0
1243 1243 while i < len(s):
1244 1244 for l in xrange(1, 4):
1245 1245 try:
1246 1246 yield dmap[s[i:i+l]]
1247 1247 i += l
1248 1248 break
1249 1249 except KeyError:
1250 1250 pass
1251 1251 else:
1252 1252 raise KeyError
1253 1253 return (lambda s: "".join([cmap[c] for c in s]),
1254 1254 lambda s: "".join(list(decode(s))))
1255 1255
1256 1256 encodefilename, decodefilename = _buildencodefun()
1257 1257
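# Worked examples of the filename encoding above (illustrative, not part
# of the original module):
#
#     encodefilename('Foo:Bar')      # -> '_foo~3a_bar'
#     encodefilename('the_file')     # -> 'the__file'  ('_' escapes itself)
#     decodefilename('_foo~3a_bar')  # -> 'Foo:Bar'
#
# Uppercase maps to '_' + lowercase and reserved/non-printable bytes map
# to '~' + two hex digits, so encoded names survive case-folding and
# Windows-reserved characters.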
1258 1258 def encodedopener(openerfn, fn):
1259 1259 def o(path, *args, **kw):
1260 1260 return openerfn(fn(path), *args, **kw)
1261 1261 return o
1262 1262
1263 1263 def mktempcopy(name, emptyok=False):
1264 1264 """Create a temporary file with the same contents as name
1265 1265
1266 1266 The permission bits are copied from the original file.
1267 1267
1268 1268 If the temporary file is going to be truncated immediately, you
1269 1269 can use emptyok=True as an optimization.
1270 1270
1271 1271 Returns the name of the temporary file.
1272 1272 """
1273 1273 d, fn = os.path.split(name)
1274 1274 fd, temp = tempfile.mkstemp(prefix='.%s-' % fn, dir=d)
1275 1275 os.close(fd)
1276 1276 # Temporary files are created with mode 0600, which is usually not
1277 1277 # what we want. If the original file already exists, just copy
1278 1278 # its mode. Otherwise, manually obey umask.
1279 1279 try:
1280 1280 st_mode = os.lstat(name).st_mode
1281 1281 except OSError, inst:
1282 1282 if inst.errno != errno.ENOENT:
1283 1283 raise
1284 1284 st_mode = 0666 & ~_umask
1285 1285 os.chmod(temp, st_mode)
1286 1286 if emptyok:
1287 1287 return temp
1288 1288 try:
1289 1289 try:
1290 1290 ifp = posixfile(name, "rb")
1291 1291 except IOError, inst:
1292 1292 if inst.errno == errno.ENOENT:
1293 1293 return temp
1294 1294 if not getattr(inst, 'filename', None):
1295 1295 inst.filename = name
1296 1296 raise
1297 1297 ofp = posixfile(temp, "wb")
1298 1298 for chunk in filechunkiter(ifp):
1299 1299 ofp.write(chunk)
1300 1300 ifp.close()
1301 1301 ofp.close()
1302 1302 except:
1303 1303 try: os.unlink(temp)
1304 1304 except: pass
1305 1305 raise
1306 1306 return temp
1307 1307
1308 1308 class atomictempfile(posixfile):
1309 1309 """file-like object that atomically updates a file
1310 1310
1311 1311 All writes will be redirected to a temporary copy of the original
1312 1312 file. When rename is called, the copy is renamed to the original
1313 1313 name, making the changes visible.
1314 1314 """
1315 1315 def __init__(self, name, mode):
1316 1316 self.__name = name
1317 1317 self.temp = mktempcopy(name, emptyok=('w' in mode))
1318 1318 posixfile.__init__(self, self.temp, mode)
1319 1319
1320 1320 def rename(self):
1321 1321 if not self.closed:
1322 1322 posixfile.close(self)
1323 1323 rename(self.temp, localpath(self.__name))
1324 1324
1325 1325 def __del__(self):
1326 1326 if not self.closed:
1327 1327 try:
1328 1328 os.unlink(self.temp)
1329 1329 except: pass
1330 1330 posixfile.close(self)
1331 1331
1332 1332 class opener(object):
1333 1333 """Open files relative to a base directory
1334 1334
1335 1335 This class is used to hide the details of COW semantics and
1336 1336 remote file access from higher level code.
1337 1337 """
1338 1338 def __init__(self, base, audit=True):
1339 1339 self.base = base
1340 1340 if audit:
1341 1341 self.audit_path = path_auditor(base)
1342 1342 else:
1343 1343 self.audit_path = always
1344 1344
1345 1345 def __getattr__(self, name):
1346 1346 if name == '_can_symlink':
1347 1347 self._can_symlink = checklink(self.base)
1348 1348 return self._can_symlink
1349 1349 raise AttributeError(name)
1350 1350
1351 1351 def __call__(self, path, mode="r", text=False, atomictemp=False):
1352 1352 self.audit_path(path)
1353 1353 f = os.path.join(self.base, path)
1354 1354
1355 1355 if not text and "b" not in mode:
1356 1356 mode += "b" # for that other OS
1357 1357
1358 1358 if mode[0] != "r":
1359 1359 try:
1360 1360 nlink = nlinks(f)
1361 1361 except OSError:
1362 1362 nlink = 0
1363 1363 d = os.path.dirname(f)
1364 1364 if not os.path.isdir(d):
1365 1365 os.makedirs(d)
1366 1366 if atomictemp:
1367 1367 return atomictempfile(f, mode)
1368 1368 if nlink > 1:
1369 1369 rename(mktempcopy(f), f)
1370 1370 return posixfile(f, mode)
1371 1371
1372 1372 def symlink(self, src, dst):
1373 1373 self.audit_path(dst)
1374 1374 linkname = os.path.join(self.base, dst)
1375 1375 try:
1376 1376 os.unlink(linkname)
1377 1377 except OSError:
1378 1378 pass
1379 1379
1380 1380 dirname = os.path.dirname(linkname)
1381 1381 if not os.path.exists(dirname):
1382 1382 os.makedirs(dirname)
1383 1383
1384 1384 if self._can_symlink:
1385 1385 try:
1386 1386 os.symlink(src, linkname)
1387 1387 except OSError, err:
1388 1388 raise OSError(err.errno, _('could not symlink to %r: %s') %
1389 1389 (src, err.strerror), linkname)
1390 1390 else:
1391 1391 f = self(dst, "w")
1392 1392 f.write(src)
1393 1393 f.close()
1394 1394
1395 1395 class chunkbuffer(object):
1396 1396 """Allow arbitrary sized chunks of data to be efficiently read from an
1397 1397 iterator over chunks of arbitrary size."""
1398 1398
1399 1399 def __init__(self, in_iter):
1400 1400 """in_iter is the iterator that's iterating over the input chunks.
1401 1401 targetsize (fixed at 2**16 here) is how big a buffer to try to maintain."""
1402 1402 self.iter = iter(in_iter)
1403 1403 self.buf = ''
1404 1404 self.targetsize = 2**16
1405 1405
1406 1406 def read(self, l):
1407 1407 """Read L bytes of data from the iterator of chunks of data.
1408 1408 Returns less than L bytes if the iterator runs dry."""
1409 1409 if l > len(self.buf) and self.iter:
1410 1410 # collect at least l bytes, and at least self.targetsize
1411 1411 targetsize = max(l, self.targetsize)
1412 1412 collector = cStringIO.StringIO()
1413 1413 collector.write(self.buf)
1414 1414 collected = len(self.buf)
1415 1415 for chunk in self.iter:
1416 1416 collector.write(chunk)
1417 1417 collected += len(chunk)
1418 1418 if collected >= targetsize:
1419 1419 break
1420 1420 if collected < targetsize:
1421 1421 self.iter = False
1422 1422 self.buf = collector.getvalue()
1423 1423 if len(self.buf) == l:
1424 s, self.buf = self.buf, ''
1424 s, self.buf = str(self.buf), ''
1425 1425 else:
1426 1426 s, self.buf = self.buf[:l], buffer(self.buf, l)
1427 1427 return s
1428 1428
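# Note on the one-line change above, the point of this commit: after a
# partial read, self.buf is a buffer object (a view into the previous
# string, created two lines below the change), so a subsequent exact-length
# read would hand that buffer to callers, and the revlog would then cache
# a buffer instead of a real str. str() copies the bytes out first:
#
#     b = buffer('abcdef', 2)   # Python 2 view onto 'cdef', not a str
#     isinstance(b, str)        # -> False
#     str(b)                    # -> 'cdef'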
1429 1429 def filechunkiter(f, size=65536, limit=None):
1430 1430 """Create a generator that produces the data in the file, size
1431 1431 (default 65536) bytes at a time, up to optional limit (default is
1432 1432 to read all data). Chunks may be less than size bytes if the
1433 1433 chunk is the last chunk in the file, or the file is a socket or
1434 1434 some other type of file that sometimes reads less data than is
1435 1435 requested."""
1436 1436 assert size >= 0
1437 1437 assert limit is None or limit >= 0
1438 1438 while True:
1439 1439 if limit is None: nbytes = size
1440 1440 else: nbytes = min(limit, size)
1441 1441 s = nbytes and f.read(nbytes)
1442 1442 if not s: break
1443 1443 if limit: limit -= len(s)
1444 1444 yield s
1445 1445
1446 1446 def makedate():
1447 1447 lt = time.localtime()
1448 1448 if lt[8] == 1 and time.daylight:
1449 1449 tz = time.altzone
1450 1450 else:
1451 1451 tz = time.timezone
1452 1452 return time.mktime(lt), tz
1453 1453
1454 1454 def datestr(date=None, format='%a %b %d %H:%M:%S %Y', timezone=True, timezone_format=" %+03d%02d"):
1455 1455 """represent a (unixtime, offset) tuple as a localized time.
1456 1456 unixtime is seconds since the epoch, and offset is the time zone's
1457 1457 number of seconds away from UTC. if timezone is false, do not
1458 1458 append time zone to string."""
1459 1459 t, tz = date or makedate()
1460 1460 s = time.strftime(format, time.gmtime(float(t) - tz))
1461 1461 if timezone:
1462 1462 s += timezone_format % (-tz / 3600, ((-tz % 3600) / 60))
1463 1463 return s
1464 1464
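# Illustrative outputs (assuming the C locale; not part of the original
# source):
#
#     datestr((0, 0))       # -> 'Thu Jan 01 00:00:00 1970 +0000'
#     datestr((0, -3600))   # -> 'Thu Jan 01 01:00:00 1970 +0100'
#
# The offset is seconds west of UTC, so a negative offset means east.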
1465 1465 def strdate(string, format, defaults=[]):
1466 1466 """parse a localized time string and return a (unixtime, offset) tuple.
1467 1467 if the string cannot be parsed, ValueError is raised."""
1468 1468 def timezone(string):
1469 1469 tz = string.split()[-1]
1470 1470 if tz[0] in "+-" and len(tz) == 5 and tz[1:].isdigit():
1471 1471 tz = int(tz)
1472 1472 offset = - 3600 * (tz / 100) - 60 * (tz % 100)
1473 1473 return offset
1474 1474 if tz == "GMT" or tz == "UTC":
1475 1475 return 0
1476 1476 return None
1477 1477
1478 1478 # NOTE: unixtime = localunixtime + offset
1479 1479 offset, date = timezone(string), string
1480 1480 if offset != None:
1481 1481 date = " ".join(string.split()[:-1])
1482 1482
1483 1483 # add missing elements from defaults
1484 1484 for part in defaults:
1485 1485 found = [True for p in part if ("%"+p) in format]
1486 1486 if not found:
1487 1487 date += "@" + defaults[part]
1488 1488 format += "@%" + part[0]
1489 1489
1490 1490 timetuple = time.strptime(date, format)
1491 1491 localunixtime = int(calendar.timegm(timetuple))
1492 1492 if offset is None:
1493 1493 # local timezone
1494 1494 unixtime = int(time.mktime(timetuple))
1495 1495 offset = unixtime - localunixtime
1496 1496 else:
1497 1497 unixtime = localunixtime + offset
1498 1498 return unixtime, offset
1499 1499
1500 1500 def parsedate(string, formats=None, defaults=None):
1501 1501 """parse a localized time string and return a (unixtime, offset) tuple.
1502 1502 The date may be a "unixtime offset" string or in one of the specified
1503 1503 formats."""
1504 1504 if not string:
1505 1505 return 0, 0
1506 1506 if not formats:
1507 1507 formats = defaultdateformats
1508 1508 string = string.strip()
1509 1509 try:
1510 1510 when, offset = map(int, string.split(' '))
1511 1511 except ValueError:
1512 1512 # fill out defaults
1513 1513 if not defaults:
1514 1514 defaults = {}
1515 1515 now = makedate()
1516 1516 for part in "d mb yY HI M S".split():
1517 1517 if part not in defaults:
1518 1518 if part[0] in "HMS":
1519 1519 defaults[part] = "00"
1520 1520 elif part[0] in "dm":
1521 1521 defaults[part] = "1"
1522 1522 else:
1523 1523 defaults[part] = datestr(now, "%" + part[0], False)
1524 1524
1525 1525 for format in formats:
1526 1526 try:
1527 1527 when, offset = strdate(string, format, defaults)
1528 1528 except ValueError:
1529 1529 pass
1530 1530 else:
1531 1531 break
1532 1532 else:
1533 1533 raise Abort(_('invalid date: %r ') % string)
1534 1534 # validate explicit (probably user-specified) date and
1535 1535 # time zone offset. values must fit in signed 32 bits for
1536 1536 # current 32-bit linux runtimes. timezones go from UTC-12
1537 1537 # to UTC+14
1538 1538 if abs(when) > 0x7fffffff:
1539 1539 raise Abort(_('date exceeds 32 bits: %d') % when)
1540 1540 if offset < -50400 or offset > 43200:
1541 1541 raise Abort(_('impossible time zone offset: %d') % offset)
1542 1542 return when, offset
1543 1543
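# Sketches of parsedate behavior (illustrative, not in the original
# source):
#
#     parsedate('1165432709 0')       # -> (1165432709, 0), internal form
#     parsedate('1165432709 -3600')   # -> (1165432709, -3600)
#     parsedate('')                   # -> (0, 0)
#
# Anything else is tried against defaultdateformats, with missing fields
# (seconds, day, year, ...) filled in from the current date via defaults.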
1544 1544 def matchdate(date):
1545 1545 """Return a function that matches a given date match specifier
1546 1546
1547 1547 Formats include:
1548 1548
1549 1549 '{date}' match a given date to the accuracy provided
1550 1550
1551 1551 '<{date}' on or before a given date
1552 1552
1553 1553 '>{date}' on or after a given date
1554 1554
1555 1555 """
1556 1556
1557 1557 def lower(date):
1558 1558 return parsedate(date, extendeddateformats)[0]
1559 1559
1560 1560 def upper(date):
1561 1561 d = dict(mb="12", HI="23", M="59", S="59")
1562 1562 for days in "31 30 29".split():
1563 1563 try:
1564 1564 d["d"] = days
1565 1565 return parsedate(date, extendeddateformats, d)[0]
1566 1566 except:
1567 1567 pass
1568 1568 d["d"] = "28"
1569 1569 return parsedate(date, extendeddateformats, d)[0]
1570 1570
1571 1571 if date[0] == "<":
1572 1572 when = upper(date[1:])
1573 1573 return lambda x: x <= when
1574 1574 elif date[0] == ">":
1575 1575 when = lower(date[1:])
1576 1576 return lambda x: x >= when
1577 1577 elif date[0] == "-":
1578 1578 try:
1579 1579 days = int(date[1:])
1580 1580 except ValueError:
1581 1581 raise Abort(_("invalid day spec: %s") % date[1:])
1582 1582 when = makedate()[0] - days * 3600 * 24
1583 1583 return lambda x: x >= when
1584 1584 elif " to " in date:
1585 1585 a, b = date.split(" to ")
1586 1586 start, stop = lower(a), upper(b)
1587 1587 return lambda x: x >= start and x <= stop
1588 1588 else:
1589 1589 start, stop = lower(date), upper(date)
1590 1590 return lambda x: x >= start and x <= stop
1591 1591
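# Hypothetical usage (not part of the original module):
#
#     m = matchdate('-7')            # last 7 days:
#                                    # x >= makedate()[0] - 7 * 3600 * 24
#     m = matchdate('>2006-05-05')   # on or after that date
#     m = matchdate('2006-05')       # anywhere within May 2006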
1592 1592 def shortuser(user):
1593 1593 """Return a short representation of a user name or email address."""
1594 1594 f = user.find('@')
1595 1595 if f >= 0:
1596 1596 user = user[:f]
1597 1597 f = user.find('<')
1598 1598 if f >= 0:
1599 1599 user = user[f+1:]
1600 1600 f = user.find(' ')
1601 1601 if f >= 0:
1602 1602 user = user[:f]
1603 1603 f = user.find('.')
1604 1604 if f >= 0:
1605 1605 user = user[:f]
1606 1606 return user
1607 1607
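# A worked example (illustrative, not in the original source):
#
#     shortuser('John Doe <john.doe@example.com>')   # -> 'john'
#
# Everything from the '@' on is dropped, then everything up to '<',
# then anything after a space or '.'.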
1608 1608 def ellipsis(text, maxlength=400):
1609 1609 """Trim string to at most maxlength (default: 400) characters."""
1610 1610 if len(text) <= maxlength:
1611 1611 return text
1612 1612 else:
1613 1613 return "%s..." % (text[:maxlength-3])
1614 1614
1615 1615 def walkrepos(path):
1616 1616 '''yield every hg repository under path, recursively.'''
1617 1617 def errhandler(err):
1618 1618 if err.filename == path:
1619 1619 raise err
1620 1620
1621 1621 for root, dirs, files in os.walk(path, onerror=errhandler):
1622 1622 for d in dirs:
1623 1623 if d == '.hg':
1624 1624 yield root
1625 1625 dirs[:] = []
1626 1626 break
1627 1627
1628 1628 _rcpath = None
1629 1629
1630 1630 def os_rcpath():
1631 1631 '''return default os-specific hgrc search path'''
1632 1632 path = system_rcpath()
1633 1633 path.extend(user_rcpath())
1634 1634 path = [os.path.normpath(f) for f in path]
1635 1635 return path
1636 1636
1637 1637 def rcpath():
1638 1638 '''return hgrc search path. if env var HGRCPATH is set, use it.
1639 1639 for each item in path, if directory, use files ending in .rc,
1640 1640 else use item.
1641 1641 make HGRCPATH empty to only look in .hg/hgrc of current repo.
1642 1642 if no HGRCPATH, use default os-specific path.'''
1643 1643 global _rcpath
1644 1644 if _rcpath is None:
1645 1645 if 'HGRCPATH' in os.environ:
1646 1646 _rcpath = []
1647 1647 for p in os.environ['HGRCPATH'].split(os.pathsep):
1648 1648 if not p: continue
1649 1649 if os.path.isdir(p):
1650 1650 for f, kind in osutil.listdir(p):
1651 1651 if f.endswith('.rc'):
1652 1652 _rcpath.append(os.path.join(p, f))
1653 1653 else:
1654 1654 _rcpath.append(p)
1655 1655 else:
1656 1656 _rcpath = os_rcpath()
1657 1657 return _rcpath
1658 1658
1659 1659 def bytecount(nbytes):
1660 1660 '''return byte count formatted as readable string, with units'''
1661 1661
1662 1662 units = (
1663 1663 (100, 1<<30, _('%.0f GB')),
1664 1664 (10, 1<<30, _('%.1f GB')),
1665 1665 (1, 1<<30, _('%.2f GB')),
1666 1666 (100, 1<<20, _('%.0f MB')),
1667 1667 (10, 1<<20, _('%.1f MB')),
1668 1668 (1, 1<<20, _('%.2f MB')),
1669 1669 (100, 1<<10, _('%.0f KB')),
1670 1670 (10, 1<<10, _('%.1f KB')),
1671 1671 (1, 1<<10, _('%.2f KB')),
1672 1672 (1, 1, _('%.0f bytes')),
1673 1673 )
1674 1674
1675 1675 for multiplier, divisor, format in units:
1676 1676 if nbytes >= divisor * multiplier:
1677 1677 return format % (nbytes / float(divisor))
1678 1678 return units[-1][2] % nbytes
1679 1679
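# Sample outputs (illustrative, not part of the original source):
#
#     bytecount(100)       # -> '100 bytes'
#     bytecount(2048)      # -> '2.00 KB'
#     bytecount(1 << 20)   # -> '1.00 MB'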
1680 1680 def drop_scheme(scheme, path):
1681 1681 sc = scheme + ':'
1682 1682 if path.startswith(sc):
1683 1683 path = path[len(sc):]
1684 1684 if path.startswith('//'):
1685 1685 path = path[2:]
1686 1686 return path
1687 1687
1688 1688 def uirepr(s):
1689 1689 # Avoid double backslash in Windows path repr()
1690 1690 return repr(s).replace('\\\\', '\\')