chunkbuffer: split big strings directly in chunkbuffer
Benoit Boissinot
r11670:1b3b843e default
@@ -1,1405 +1,1398 @@
# revlog.py - storage back-end for mercurial
#
# Copyright 2005-2007 Matt Mackall <mpm@selenic.com>
#
# This software may be used and distributed according to the terms of the
# GNU General Public License version 2 or any later version.

"""Storage back-end for Mercurial.

This provides efficient delta storage with O(1) retrieve and append
and O(changes) merge between branches.
"""

# import stuff from node for others to import from revlog
from node import bin, hex, nullid, nullrev, short #@UnusedImport
from i18n import _
import changegroup, ancestor, mdiff, parsers, error, util
import struct, zlib, errno

_pack = struct.pack
_unpack = struct.unpack
_compress = zlib.compress
_decompress = zlib.decompress
_sha = util.sha1

# revlog flags
REVLOGV0 = 0
REVLOGNG = 1
REVLOGNGINLINEDATA = (1 << 16)
REVLOG_DEFAULT_FLAGS = REVLOGNGINLINEDATA
REVLOG_DEFAULT_FORMAT = REVLOGNG
REVLOG_DEFAULT_VERSION = REVLOG_DEFAULT_FORMAT | REVLOG_DEFAULT_FLAGS

# amount of data read unconditionally, should be >= 4
# when not inline: threshold for using lazy index
_prereadsize = 1048576
# max size of revlog with inline data
_maxinline = 131072

RevlogError = error.RevlogError
LookupError = error.LookupError

def getoffset(q):
    return int(q >> 16)

def gettype(q):
    return int(q & 0xFFFF)

def offset_type(offset, type):
    return long(long(offset) << 16 | type)

nullhash = _sha(nullid)

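# Editor's illustration (not part of the original module): a minimal
# sketch of how the helpers above multiplex a 48-bit file offset and a
# 16-bit flag field into one 64-bit index value. Values are arbitrary.
def _demo_offset_type():
    packed = offset_type(4096, 1)    # offset 4096 with flag bit 0 set
    assert getoffset(packed) == 4096
    assert gettype(packed) == 1
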
def hash(text, p1, p2):
    """generate a hash from the given text and its parent hashes

    This hash combines both the current file contents and its history
    in a manner that makes it easy to distinguish nodes with the same
    content in the revision graph.
    """
    # As of now, if one of the parent nodes is null, p2 is null
    if p2 == nullid:
        # deep copy of a hash is faster than creating one
        s = nullhash.copy()
        s.update(p1)
    else:
        # none of the parent nodes are nullid
        l = [p1, p2]
        l.sort()
        s = _sha(l[0])
        s.update(l[1])
    s.update(text)
    return s.digest()

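# Editor's illustration (not part of the original module): node hashes
# are insensitive to parent order, because the parents are sorted before
# hashing; with a null parent, the precomputed nullhash path is taken. A
# minimal sketch; 'a' and 'b' stand in for arbitrary parent ids.
def _demo_hash():
    p1 = _sha('a').digest()
    p2 = _sha('b').digest()
    assert hash('text', p1, p2) == hash('text', p2, p1)
    assert hash('text', p1, nullid) == _sha(nullid + p1 + 'text').digest()
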
def compress(text):
    """ generate a possibly-compressed representation of text """
    if not text:
        return ("", text)
    l = len(text)
    bin = None
    if l < 44:
        pass
    elif l > 1000000:
        # zlib makes an internal copy, thus doubling memory usage for
        # large files, so let's do this in pieces
        z = zlib.compressobj()
        p = []
        pos = 0
        while pos < l:
            pos2 = pos + 2**20
            p.append(z.compress(text[pos:pos2]))
            pos = pos2
        p.append(z.flush())
        if sum(map(len, p)) < l:
            bin = "".join(p)
    else:
        bin = _compress(text)
    if bin is None or len(bin) > l:
        if text[0] == '\0':
            return ("", text)
        return ('u', text)
    return ("", bin)

def decompress(bin):
    """ decompress the given input """
    if not bin:
        return bin
    t = bin[0]
    if t == '\0':
        return bin
    if t == 'x':
        return _decompress(bin)
    if t == 'u':
        return bin[1:]
    raise RevlogError(_("unknown compression type %r") % t)

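# Editor's illustration (not part of the original module): whichever
# header compress() picks (empty for zlib data or empty input, 'u' for
# stored-uncompressed), decompress() of the concatenated pair restores
# the input. A minimal round-trip sketch.
def _demo_compress_roundtrip():
    for text in ("", "short", "x" * 100000):
        header, data = compress(text)
        assert decompress(header + data) == text
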
class lazyparser(object):
    """
    this class avoids the need to parse the entirety of large indices
    """

    # lazyparser is not safe to use on windows if win32 extensions not
    # available. it keeps the file handle open, which makes it impossible
    # to break hardlinks on locally cloned repos.

    def __init__(self, dataf):
        try:
            size = util.fstat(dataf).st_size
        except AttributeError:
            size = 0
        self.dataf = dataf
        self.s = struct.calcsize(indexformatng)
        self.datasize = size
        self.l = size // self.s
        self.index = [None] * self.l
        self.map = {nullid: nullrev}
        self.allmap = 0
        self.all = 0
        self.mapfind_count = 0

    def loadmap(self):
        """
        during a commit, we need to make sure the rev being added is
        not a duplicate. This requires loading the entire index,
        which is fairly slow. loadmap can load up just the node map,
        which takes much less time.
        """
        if self.allmap:
            return
        end = self.datasize
        self.allmap = 1
        cur = 0
        count = 0
        blocksize = self.s * 256
        self.dataf.seek(0)
        while cur < end:
            data = self.dataf.read(blocksize)
            off = 0
            for x in xrange(256):
                n = data[off + ngshaoffset:off + ngshaoffset + 20]
                self.map[n] = count
                count += 1
                if count >= self.l:
                    break
                off += self.s
            cur += blocksize

    def loadblock(self, blockstart, blocksize, data=None):
        if self.all:
            return
        if data is None:
            self.dataf.seek(blockstart)
            if blockstart + blocksize > self.datasize:
                # the revlog may have grown since we've started running,
                # but we don't have space in self.index for more entries.
                # limit blocksize so that we don't get too much data.
                blocksize = max(self.datasize - blockstart, 0)
            data = self.dataf.read(blocksize)
        lend = len(data) // self.s
        i = blockstart // self.s
        off = 0
        # lazyindex supports __delitem__
        if lend > len(self.index) - i:
            lend = len(self.index) - i
        for x in xrange(lend):
            if self.index[i + x] is None:
                b = data[off : off + self.s]
                self.index[i + x] = b
                n = b[ngshaoffset:ngshaoffset + 20]
                self.map[n] = i + x
            off += self.s

    def findnode(self, node):
        """search backwards through the index file for a specific node"""
        if self.allmap:
            return None

        # hg log will cause many many searches for the manifest
        # nodes. After we get called a few times, just load the whole
        # thing.
        if self.mapfind_count > 8:
            self.loadmap()
            if node in self.map:
                return node
            return None
        self.mapfind_count += 1
        last = self.l - 1
        while self.index[last] != None:
            if last == 0:
                self.all = 1
                self.allmap = 1
                return None
            last -= 1
        end = (last + 1) * self.s
        blocksize = self.s * 256
        while end >= 0:
            start = max(end - blocksize, 0)
            self.dataf.seek(start)
            data = self.dataf.read(end - start)
            findend = end - start
            while True:
                # we're searching backwards, so we have to make sure
                # we don't find a changeset where this node is a parent
                off = data.find(node, 0, findend)
                findend = off
                if off >= 0:
                    i = off / self.s
                    off = i * self.s
                    n = data[off + ngshaoffset:off + ngshaoffset + 20]
                    if n == node:
                        self.map[n] = i + start / self.s
                        return node
                else:
                    break
            end -= blocksize
        return None

    def loadindex(self, i=None, end=None):
        if self.all:
            return
        all = False
        if i is None:
            blockstart = 0
            blocksize = (65536 / self.s) * self.s
            end = self.datasize
            all = True
        else:
            if end:
                blockstart = i * self.s
                end = end * self.s
                blocksize = end - blockstart
            else:
                blockstart = (i & ~1023) * self.s
                blocksize = self.s * 1024
                end = blockstart + blocksize
        while blockstart < end:
            self.loadblock(blockstart, blocksize)
            blockstart += blocksize
        if all:
            self.all = True

class lazyindex(object):
    """a lazy version of the index array"""
    def __init__(self, parser):
        self.p = parser
    def __len__(self):
        return len(self.p.index)
    def load(self, pos):
        if pos < 0:
            pos += len(self.p.index)
        self.p.loadindex(pos)
        return self.p.index[pos]
    def __getitem__(self, pos):
        return _unpack(indexformatng, self.p.index[pos] or self.load(pos))
    def __setitem__(self, pos, item):
        self.p.index[pos] = _pack(indexformatng, *item)
    def __delitem__(self, pos):
        del self.p.index[pos]
    def insert(self, pos, e):
        self.p.index.insert(pos, _pack(indexformatng, *e))
    def append(self, e):
        self.p.index.append(_pack(indexformatng, *e))

class lazymap(object):
    """a lazy version of the node map"""
    def __init__(self, parser):
        self.p = parser
    def load(self, key):
        n = self.p.findnode(key)
        if n is None:
            raise KeyError(key)
    def __contains__(self, key):
        if key in self.p.map:
            return True
        self.p.loadmap()
        return key in self.p.map
    def __iter__(self):
        yield nullid
        for i, ret in enumerate(self.p.index):
            if not ret:
                self.p.loadindex(i)
                ret = self.p.index[i]
            if isinstance(ret, str):
                ret = _unpack(indexformatng, ret)
            yield ret[7]
    def __getitem__(self, key):
        try:
            return self.p.map[key]
        except KeyError:
            try:
                self.load(key)
                return self.p.map[key]
            except KeyError:
                raise KeyError("node " + hex(key))
    def __setitem__(self, key, val):
        self.p.map[key] = val
    def __delitem__(self, key):
        del self.p.map[key]

indexformatv0 = ">4l20s20s20s"
v0shaoffset = 56

class revlogoldio(object):
    def __init__(self):
        self.size = struct.calcsize(indexformatv0)

    def parseindex(self, fp, data, inline):
        s = self.size
        index = []
        nodemap = {nullid: nullrev}
        n = off = 0
        if len(data) == _prereadsize:
            data += fp.read() # read the rest
        l = len(data)
        while off + s <= l:
            cur = data[off:off + s]
            off += s
            e = _unpack(indexformatv0, cur)
            # transform to revlogv1 format
            e2 = (offset_type(e[0], 0), e[1], -1, e[2], e[3],
                  nodemap.get(e[4], nullrev), nodemap.get(e[5], nullrev), e[6])
            index.append(e2)
            nodemap[e[6]] = n
            n += 1

        return index, nodemap, None

    def packentry(self, entry, node, version, rev):
        if gettype(entry[0]):
            raise RevlogError(_("index entry flags need RevlogNG"))
        e2 = (getoffset(entry[0]), entry[1], entry[3], entry[4],
              node(entry[5]), node(entry[6]), entry[7])
        return _pack(indexformatv0, *e2)

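# Editor's illustration (not part of the original module): a version-0
# index record is 76 bytes — four 32-bit ints followed by three 20-byte
# nodeids (self, parent 1, parent 2).
def _demo_v0entry():
    assert struct.calcsize(indexformatv0) == 4 * 4 + 3 * 20  # 76 bytes
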
# index ng:
#  6 bytes: offset
#  2 bytes: flags
#  4 bytes: compressed length
#  4 bytes: uncompressed length
#  4 bytes: base rev
#  4 bytes: link rev
#  4 bytes: parent 1 rev
#  4 bytes: parent 2 rev
# 32 bytes: nodeid
indexformatng = ">Qiiiiii20s12x"
ngshaoffset = 32
versionformat = ">I"

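# Editor's illustration (not part of the original module): a RevlogNG
# record is 64 bytes, with offset and flags packed into the leading
# 64-bit field by offset_type(). A minimal pack/unpack sketch; the field
# values here are made up.
def _demo_ngentry():
    assert struct.calcsize(indexformatng) == 64
    e = (offset_type(8192, 0), 120, 300, 4, 7, 3, -1, nullid)
    unpacked = _unpack(indexformatng, _pack(indexformatng, *e))
    assert getoffset(unpacked[0]) == 8192 and unpacked[7] == nullid
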
class revlogio(object):
    def __init__(self):
        self.size = struct.calcsize(indexformatng)

    def parseindex(self, fp, data, inline):
        if len(data) == _prereadsize:
            if util.openhardlinks() and not inline:
                # big index, let's parse it on demand
                parser = lazyparser(fp)
                index = lazyindex(parser)
                nodemap = lazymap(parser)
                e = list(index[0])
                type = gettype(e[0])
                e[0] = offset_type(0, type)
                index[0] = e
                return index, nodemap, None
            else:
                data += fp.read()

        # call the C implementation to parse the index data
        index, nodemap, cache = parsers.parse_index(data, inline)
        return index, nodemap, cache

    def packentry(self, entry, node, version, rev):
        p = _pack(indexformatng, *entry)
        if rev == 0:
            p = _pack(versionformat, version) + p[4:]
        return p

class revlog(object):
    """
    the underlying revision storage object

    A revlog consists of two parts, an index and the revision data.

    The index is a file with a fixed record size containing
    information on each revision, including its nodeid (hash), the
    nodeids of its parents, the position and offset of its data within
    the data file, and the revision it's based on. Finally, each entry
    contains a linkrev entry that can serve as a pointer to external
    data.

    The revision data itself is a linear collection of data chunks.
    Each chunk represents a revision and is usually represented as a
    delta against the previous chunk. To bound lookup time, runs of
    deltas are limited to about 2 times the length of the original
    version data. This makes retrieval of a version proportional to
    its size, or O(1) relative to the number of revisions.

    Both pieces of the revlog are written to in an append-only
    fashion, which means we never need to rewrite a file to insert or
    remove data, and can use some simple techniques to avoid the need
    for locking while reading.
    """
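    # Editor's note (illustrative, not part of the original file): a
    # revision r is rebuilt by walking its delta chain, conceptually:
    #
    #     text = decompress(chunk(base(r)))
    #     for i in xrange(base(r) + 1, r + 1):
    #         text = mdiff.patch(text, decompress(chunk(i)))
    #
    # Because chain length is capped near twice the text size, retrieval
    # cost tracks the revision's size, not the number of revisions.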
    def __init__(self, opener, indexfile):
        """
        create a revlog object

        opener is a function that abstracts the file opening operation
        and can be used to implement COW semantics or the like.
        """
        self.indexfile = indexfile
        self.datafile = indexfile[:-2] + ".d"
        self.opener = opener
        self._cache = None
        self._chunkcache = (0, '')
        self.nodemap = {nullid: nullrev}
        self.index = []

        v = REVLOG_DEFAULT_VERSION
        if hasattr(opener, 'options') and 'defversion' in opener.options:
            v = opener.options['defversion']
            if v & REVLOGNG:
                v |= REVLOGNGINLINEDATA

        i = ''
        try:
            f = self.opener(self.indexfile)
            if "nonlazy" in getattr(self.opener, 'options', {}):
                i = f.read()
            else:
                i = f.read(_prereadsize)
            if len(i) > 0:
                v = struct.unpack(versionformat, i[:4])[0]
        except IOError, inst:
            if inst.errno != errno.ENOENT:
                raise

        self.version = v
        self._inline = v & REVLOGNGINLINEDATA
        flags = v & ~0xFFFF
        fmt = v & 0xFFFF
        if fmt == REVLOGV0 and flags:
            raise RevlogError(_("index %s unknown flags %#04x for format v0")
                              % (self.indexfile, flags >> 16))
        elif fmt == REVLOGNG and flags & ~REVLOGNGINLINEDATA:
            raise RevlogError(_("index %s unknown flags %#04x for revlogng")
                              % (self.indexfile, flags >> 16))
        elif fmt > REVLOGNG:
            raise RevlogError(_("index %s unknown format %d")
                              % (self.indexfile, fmt))

        self._io = revlogio()
        if self.version == REVLOGV0:
            self._io = revlogoldio()
        if i:
            try:
                d = self._io.parseindex(f, i, self._inline)
            except (ValueError, IndexError):
                raise RevlogError(_("index %s is corrupted") % (self.indexfile))
            self.index, self.nodemap, self._chunkcache = d
            if not self._chunkcache:
                self._chunkclear()

        # add the magic null revision at -1 (if it hasn't been done already)
        if (self.index == [] or isinstance(self.index, lazyindex) or
            self.index[-1][7] != nullid):
            self.index.append((0, 0, 0, -1, -1, -1, -1, nullid))

    def _loadindex(self, start, end):
        """load a block of indexes all at once from the lazy parser"""
        if isinstance(self.index, lazyindex):
            self.index.p.loadindex(start, end)

    def _loadindexmap(self):
        """loads both the map and the index from the lazy parser"""
        if isinstance(self.index, lazyindex):
            p = self.index.p
            p.loadindex()
            self.nodemap = p.map

    def _loadmap(self):
        """loads the map from the lazy parser"""
        if isinstance(self.nodemap, lazymap):
            self.nodemap.p.loadmap()
            self.nodemap = self.nodemap.p.map

    def tip(self):
        return self.node(len(self.index) - 2)
    def __len__(self):
        return len(self.index) - 1
    def __iter__(self):
        for i in xrange(len(self)):
            yield i
    def rev(self, node):
        try:
            return self.nodemap[node]
        except KeyError:
            raise LookupError(node, self.indexfile, _('no node'))
    def node(self, rev):
        return self.index[rev][7]
    def linkrev(self, rev):
        return self.index[rev][4]
    def parents(self, node):
        i = self.index
        d = i[self.rev(node)]
        return i[d[5]][7], i[d[6]][7] # map revisions to nodes inline
    def parentrevs(self, rev):
        return self.index[rev][5:7]
    def start(self, rev):
        return int(self.index[rev][0] >> 16)
    def end(self, rev):
        return self.start(rev) + self.length(rev)
    def length(self, rev):
        return self.index[rev][1]
    def base(self, rev):
        return self.index[rev][3]

    def size(self, rev):
        """return the length of the uncompressed text for a given revision"""
        l = self.index[rev][2]
        if l >= 0:
            return l

        t = self.revision(self.node(rev))
        return len(t)

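    # Editor's note (illustrative, not part of the original file): the
    # accessors above are thin views over the 8-tuple stored per entry:
    #
    #     (offset_flags, comp_len, uncomp_len, base, link, p1, p2, node)
    #
    # e.g. start(rev) shifts the flags out of index[rev][0], and size(rev)
    # rebuilds the text only when uncomp_len is -1 (converted v0 entries).
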
    def reachable(self, node, stop=None):
        """return the set of all nodes ancestral to a given node, including
        the node itself, stopping when stop is matched"""
        reachable = set((node,))
        visit = [node]
        if stop:
            stopn = self.rev(stop)
        else:
            stopn = 0
        while visit:
            n = visit.pop(0)
            if n == stop:
                continue
            if n == nullid:
                continue
            for p in self.parents(n):
                if self.rev(p) < stopn:
                    continue
                if p not in reachable:
                    reachable.add(p)
                    visit.append(p)
        return reachable

    def ancestors(self, *revs):
        """Generate the ancestors of 'revs' in reverse topological order.

        Yield a sequence of revision numbers starting with the parents
        of each revision in revs, i.e., each revision is *not* considered
        an ancestor of itself. Results are in breadth-first order:
        parents of each rev in revs, then parents of those, etc. Result
        does not include the null revision."""
        visit = list(revs)
        seen = set([nullrev])
        while visit:
            for parent in self.parentrevs(visit.pop(0)):
                if parent not in seen:
                    visit.append(parent)
                    seen.add(parent)
                    yield parent

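    # Editor's note (illustrative, not part of the original file): on a
    # toy graph 0 <- 1, 0 <- 2, (1, 2) <- 3, ancestors(3) yields the
    # parents first and each rev only once: 1, 2, then 0.
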
    def descendants(self, *revs):
        """Generate the descendants of 'revs' in revision order.

        Yield a sequence of revision numbers starting with a child of
        some rev in revs, i.e., each revision is *not* considered a
        descendant of itself. Results are ordered by revision number (a
        topological sort)."""
        seen = set(revs)
        for i in xrange(min(revs) + 1, len(self)):
            for x in self.parentrevs(i):
                if x != nullrev and x in seen:
                    seen.add(i)
                    yield i
                    break

    def findmissing(self, common=None, heads=None):
        """Return the ancestors of heads that are not ancestors of common.

        More specifically, return a list of nodes N such that every N
        satisfies the following constraints:

          1. N is an ancestor of some node in 'heads'
          2. N is not an ancestor of any node in 'common'

        The list is sorted by revision number, meaning it is
        topologically sorted.

        'heads' and 'common' are both lists of node IDs. If heads is
        not supplied, uses all of the revlog's heads. If common is not
        supplied, uses nullid."""
        if common is None:
            common = [nullid]
        if heads is None:
            heads = self.heads()

        common = [self.rev(n) for n in common]
        heads = [self.rev(n) for n in heads]

        # we want the ancestors, but inclusive
        has = set(self.ancestors(*common))
        has.add(nullrev)
        has.update(common)

        # take all ancestors from heads that aren't in has
        missing = set()
        visit = [r for r in heads if r not in has]
        while visit:
            r = visit.pop(0)
            if r in missing:
                continue
            else:
                missing.add(r)
                for p in self.parentrevs(r):
                    if p not in has:
                        visit.append(p)
        missing = list(missing)
        missing.sort()
        return [self.node(r) for r in missing]

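    # Editor's note (illustrative, not part of the original file): on a
    # toy graph 0 <- 1 <- 2 with a branch 1 <- 3, calling
    # findmissing(common=[node(2)], heads=[node(3)]) returns just
    # [node(3)]: revs 0 and 1 are already ancestors of the common set.
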
    def nodesbetween(self, roots=None, heads=None):
        """Return a topological path from 'roots' to 'heads'.

        Return a tuple (nodes, outroots, outheads) where 'nodes' is a
        topologically sorted list of all nodes N that satisfy both of
        these constraints:

          1. N is a descendant of some node in 'roots'
          2. N is an ancestor of some node in 'heads'

        Every node is considered to be both a descendant and an ancestor
        of itself, so every reachable node in 'roots' and 'heads' will be
        included in 'nodes'.

        'outroots' is the list of reachable nodes in 'roots', i.e., the
        subset of 'roots' that is returned in 'nodes'. Likewise,
        'outheads' is the subset of 'heads' that is also in 'nodes'.

        'roots' and 'heads' are both lists of node IDs. If 'roots' is
        unspecified, uses nullid as the only root. If 'heads' is
        unspecified, uses list of all of the revlog's heads."""
        nonodes = ([], [], [])
        if roots is not None:
            roots = list(roots)
            if not roots:
                return nonodes
            lowestrev = min([self.rev(n) for n in roots])
        else:
            roots = [nullid] # Everybody's a descendent of nullid
            lowestrev = nullrev
        if (lowestrev == nullrev) and (heads is None):
            # We want _all_ the nodes!
            return ([self.node(r) for r in self], [nullid], list(self.heads()))
        if heads is None:
            # All nodes are ancestors, so the latest ancestor is the last
            # node.
            highestrev = len(self) - 1
            # Set ancestors to None to signal that every node is an ancestor.
            ancestors = None
            # Set heads to an empty dictionary for later discovery of heads
            heads = {}
        else:
            heads = list(heads)
            if not heads:
                return nonodes
            ancestors = set()
            # Turn heads into a dictionary so we can remove 'fake' heads.
            # Also, later we will be using it to filter out the heads we can't
            # find from roots.
            heads = dict.fromkeys(heads, 0)
            # Start at the top and keep marking parents until we're done.
            nodestotag = set(heads)
            # Remember where the top was so we can use it as a limit later.
            highestrev = max([self.rev(n) for n in nodestotag])
            while nodestotag:
                # grab a node to tag
                n = nodestotag.pop()
                # Never tag nullid
                if n == nullid:
                    continue
                # A node's revision number represents its place in a
                # topologically sorted list of nodes.
                r = self.rev(n)
                if r >= lowestrev:
                    if n not in ancestors:
                        # If we are possibly a descendent of one of the roots
                        # and we haven't already been marked as an ancestor
                        ancestors.add(n) # Mark as ancestor
                        # Add non-nullid parents to list of nodes to tag.
                        nodestotag.update([p for p in self.parents(n) if
                                           p != nullid])
                    elif n in heads: # We've seen it before, is it a fake head?
                        # So it is, real heads should not be the ancestors of
                        # any other heads.
                        heads.pop(n)
            if not ancestors:
                return nonodes
            # Now that we have our set of ancestors, we want to remove any
            # roots that are not ancestors.

            # If one of the roots was nullid, everything is included anyway.
            if lowestrev > nullrev:
                # But, since we weren't, let's recompute the lowest rev to not
                # include roots that aren't ancestors.

                # Filter out roots that aren't ancestors of heads
                roots = [n for n in roots if n in ancestors]
                # Recompute the lowest revision
                if roots:
                    lowestrev = min([self.rev(n) for n in roots])
                else:
                    # No more roots? Return empty list
                    return nonodes
            else:
                # We are descending from nullid, and don't need to care about
                # any other roots.
                lowestrev = nullrev
                roots = [nullid]
        # Transform our roots list into a set.
        descendents = set(roots)
        # Also, keep the original roots so we can filter out roots that aren't
        # 'real' roots (i.e. are descended from other roots).
        roots = descendents.copy()
        # Our topologically sorted list of output nodes.
        orderedout = []
        # Don't start at nullid since we don't want nullid in our output list,
        # and if nullid shows up in descendents, empty parents will look like
        # they're descendents.
        for r in xrange(max(lowestrev, 0), highestrev + 1):
            n = self.node(r)
            isdescendent = False
            if lowestrev == nullrev:  # Everybody is a descendent of nullid
                isdescendent = True
            elif n in descendents:
                # n is already a descendent
                isdescendent = True
                # This check only needs to be done here because all the roots
                # will start being marked as descendents before the loop.
                if n in roots:
                    # If n was a root, check if it's a 'real' root.
                    p = tuple(self.parents(n))
                    # If any of its parents are descendents, it's not a root.
                    if (p[0] in descendents) or (p[1] in descendents):
                        roots.remove(n)
            else:
                p = tuple(self.parents(n))
                # A node is a descendent if either of its parents are
                # descendents. (We seeded the descendents list with the roots
                # up there, remember?)
                if (p[0] in descendents) or (p[1] in descendents):
                    descendents.add(n)
                    isdescendent = True
            if isdescendent and ((ancestors is None) or (n in ancestors)):
                # Only include nodes that are both descendents and ancestors.
                orderedout.append(n)
                if (ancestors is not None) and (n in heads):
                    # We're trying to figure out which heads are reachable
                    # from roots.
                    # Mark this head as having been reached
                    heads[n] = 1
                elif ancestors is None:
                    # Otherwise, we're trying to discover the heads.
                    # Assume this is a head because if it isn't, the next step
                    # will eventually remove it.
                    heads[n] = 1
                    # But, obviously its parents aren't.
                    for p in self.parents(n):
                        heads.pop(p, None)
        heads = [n for n in heads.iterkeys() if heads[n] != 0]
        roots = list(roots)
        assert orderedout
        assert roots
        assert heads
        return (orderedout, roots, heads)

    def heads(self, start=None, stop=None):
        """return the list of all nodes that have no children

        if start is specified, only heads that are descendants of
        start will be returned
        if stop is specified, it will consider all the revs from stop
        as if they had no children
        """
        if start is None and stop is None:
            count = len(self)
            if not count:
                return [nullid]
            ishead = [1] * (count + 1)
            index = self.index
            for r in xrange(count):
                e = index[r]
                ishead[e[5]] = ishead[e[6]] = 0
            return [self.node(r) for r in xrange(count) if ishead[r]]

        if start is None:
            start = nullid
        if stop is None:
            stop = []
        stoprevs = set([self.rev(n) for n in stop])
        startrev = self.rev(start)
        reachable = set((startrev,))
        heads = set((startrev,))

        parentrevs = self.parentrevs
        for r in xrange(startrev + 1, len(self)):
            for p in parentrevs(r):
                if p in reachable:
                    if r not in stoprevs:
                        reachable.add(r)
                        heads.add(r)
                    if p in heads and p not in stoprevs:
                        heads.remove(p)

        return [self.node(r) for r in heads]

    def children(self, node):
        """find the children of a given node"""
        c = []
        p = self.rev(node)
        for r in range(p + 1, len(self)):
            prevs = [pr for pr in self.parentrevs(r) if pr != nullrev]
            if prevs:
                for pr in prevs:
                    if pr == p:
                        c.append(self.node(r))
            elif p == nullrev:
                c.append(self.node(r))
        return c

    def descendant(self, start, end):
        for i in self.descendants(start):
            if i == end:
                return True
            elif i > end:
                break
        return False

    def ancestor(self, a, b):
        """calculate the least common ancestor of nodes a and b"""

        # fast path, check if it is a descendant
        a, b = self.rev(a), self.rev(b)
        start, end = sorted((a, b))
        if self.descendant(start, end):
            return self.node(start)

        def parents(rev):
            return [p for p in self.parentrevs(rev) if p != nullrev]

        c = ancestor.ancestor(a, b, parents)
        if c is None:
            return nullid

        return self.node(c)

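    # Editor's note (illustrative, not part of the original file): for
    # two branches 0 <- 1 and 0 <- 2, neither rev descends from the
    # other, so the fast path fails and the generic ancestor.ancestor()
    # walk runs; the least common ancestor of node(1) and node(2) is
    # node(0).
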
880 def _match(self, id):
880 def _match(self, id):
881 if isinstance(id, (long, int)):
881 if isinstance(id, (long, int)):
882 # rev
882 # rev
883 return self.node(id)
883 return self.node(id)
884 if len(id) == 20:
884 if len(id) == 20:
885 # possibly a binary node
885 # possibly a binary node
886 # odds of a binary node being all hex in ASCII are 1 in 10**25
886 # odds of a binary node being all hex in ASCII are 1 in 10**25
887 try:
887 try:
888 node = id
888 node = id
889 self.rev(node) # quick search the index
889 self.rev(node) # quick search the index
890 return node
890 return node
891 except LookupError:
891 except LookupError:
892 pass # may be partial hex id
892 pass # may be partial hex id
893 try:
893 try:
894 # str(rev)
894 # str(rev)
895 rev = int(id)
895 rev = int(id)
896 if str(rev) != id:
896 if str(rev) != id:
897 raise ValueError
897 raise ValueError
898 if rev < 0:
898 if rev < 0:
899 rev = len(self) + rev
899 rev = len(self) + rev
900 if rev < 0 or rev >= len(self):
900 if rev < 0 or rev >= len(self):
901 raise ValueError
901 raise ValueError
902 return self.node(rev)
902 return self.node(rev)
903 except (ValueError, OverflowError):
903 except (ValueError, OverflowError):
904 pass
904 pass
905 if len(id) == 40:
905 if len(id) == 40:
906 try:
906 try:
907 # a full hex nodeid?
907 # a full hex nodeid?
908 node = bin(id)
908 node = bin(id)
909 self.rev(node)
909 self.rev(node)
910 return node
910 return node
911 except (TypeError, LookupError):
911 except (TypeError, LookupError):
912 pass
912 pass
913
913
914 def _partialmatch(self, id):
914 def _partialmatch(self, id):
915 if len(id) < 40:
915 if len(id) < 40:
916 try:
916 try:
917 # hex(node)[:...]
917 # hex(node)[:...]
918 l = len(id) // 2 # grab an even number of digits
918 l = len(id) // 2 # grab an even number of digits
919 bin_id = bin(id[:l * 2])
919 bin_id = bin(id[:l * 2])
920 nl = [n for n in self.nodemap if n[:l] == bin_id]
920 nl = [n for n in self.nodemap if n[:l] == bin_id]
921 nl = [n for n in nl if hex(n).startswith(id)]
921 nl = [n for n in nl if hex(n).startswith(id)]
922 if len(nl) > 0:
922 if len(nl) > 0:
923 if len(nl) == 1:
923 if len(nl) == 1:
924 return nl[0]
924 return nl[0]
925 raise LookupError(id, self.indexfile,
925 raise LookupError(id, self.indexfile,
926 _('ambiguous identifier'))
926 _('ambiguous identifier'))
927 return None
927 return None
928 except TypeError:
928 except TypeError:
929 pass
929 pass
930
930
931 def lookup(self, id):
931 def lookup(self, id):
932 """locate a node based on:
932 """locate a node based on:
933 - revision number or str(revision number)
933 - revision number or str(revision number)
934 - nodeid or subset of hex nodeid
934 - nodeid or subset of hex nodeid
935 """
935 """
936 n = self._match(id)
936 n = self._match(id)
937 if n is not None:
937 if n is not None:
938 return n
938 return n
939 n = self._partialmatch(id)
939 n = self._partialmatch(id)
940 if n:
940 if n:
941 return n
941 return n
942
942
943 raise LookupError(id, self.indexfile, _('no match found'))
943 raise LookupError(id, self.indexfile, _('no match found'))
944
944
945 def cmp(self, node, text):
945 def cmp(self, node, text):
946 """compare text with a given file revision
946 """compare text with a given file revision
947
947
948 returns True if text is different from what is stored.
948 returns True if text is different from what is stored.
949 """
949 """
950 p1, p2 = self.parents(node)
950 p1, p2 = self.parents(node)
951 return hash(text, p1, p2) != node
951 return hash(text, p1, p2) != node
952
952
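# Minimal usage sketch for cmp() (hypothetical names). The comparison
# never reconstructs the stored text; it hashes the candidate text with
# the revision's parents and compares against the node itself:
#
#   node = rlog.node(len(rlog) - 1)     # last revision
#   if rlog.cmp(node, newtext):         # True -> contents differ
#       pass                            # e.g. record a new revision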
953 def _addchunk(self, offset, data):
953 def _addchunk(self, offset, data):
954 o, d = self._chunkcache
954 o, d = self._chunkcache
955 # try to add to existing cache
955 # try to add to existing cache
956 if o + len(d) == offset and len(d) + len(data) < _prereadsize:
956 if o + len(d) == offset and len(d) + len(data) < _prereadsize:
957 self._chunkcache = o, d + data
957 self._chunkcache = o, d + data
958 else:
958 else:
959 self._chunkcache = offset, data
959 self._chunkcache = offset, data
960
960
961 def _loadchunk(self, offset, length):
961 def _loadchunk(self, offset, length):
962 if self._inline:
962 if self._inline:
963 df = self.opener(self.indexfile)
963 df = self.opener(self.indexfile)
964 else:
964 else:
965 df = self.opener(self.datafile)
965 df = self.opener(self.datafile)
966
966
967 readahead = max(65536, length)
967 readahead = max(65536, length)
968 df.seek(offset)
968 df.seek(offset)
969 d = df.read(readahead)
969 d = df.read(readahead)
970 self._addchunk(offset, d)
970 self._addchunk(offset, d)
971 if readahead > length:
971 if readahead > length:
972 return d[:length]
972 return d[:length]
973 return d
973 return d
974
974
975 def _getchunk(self, offset, length):
975 def _getchunk(self, offset, length):
976 o, d = self._chunkcache
976 o, d = self._chunkcache
977 l = len(d)
977 l = len(d)
978
978
979 # is it in the cache?
979 # is it in the cache?
980 cachestart = offset - o
980 cachestart = offset - o
981 cacheend = cachestart + length
981 cacheend = cachestart + length
982 if cachestart >= 0 and cacheend <= l:
982 if cachestart >= 0 and cacheend <= l:
983 if cachestart == 0 and cacheend == l:
983 if cachestart == 0 and cacheend == l:
984 return d # avoid a copy
984 return d # avoid a copy
985 return d[cachestart:cacheend]
985 return d[cachestart:cacheend]
986
986
987 return self._loadchunk(offset, length)
987 return self._loadchunk(offset, length)
988
988
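# Worked example of the cache-window test above. With
# self._chunkcache == (4096, d) and len(d) == 65536, a request for
# offset=8192, length=1024 gives cachestart = 8192 - 4096 = 4096 and
# cacheend = 5120; both lie within [0, 65536], so d[4096:5120] is
# returned without touching the file.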
989 def _chunkraw(self, startrev, endrev):
989 def _chunkraw(self, startrev, endrev):
990 start = self.start(startrev)
990 start = self.start(startrev)
991 length = self.end(endrev) - start
991 length = self.end(endrev) - start
992 if self._inline:
992 if self._inline:
993 start += (startrev + 1) * self._io.size
993 start += (startrev + 1) * self._io.size
994 return self._getchunk(start, length)
994 return self._getchunk(start, length)
995
995
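# The inline adjustment above reflects the layout of an inline revlog,
# where each revision's data chunk directly follows its index entry in
# the .i file:
#
#   entry(0) data(0) entry(1) data(1) ... entry(n) data(n)
#
# so the data for revs startrev..endrev begins (startrev + 1) index
# entries (self._io.size bytes each) past self.start(startrev).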
996 def _chunk(self, rev):
996 def _chunk(self, rev):
997 return decompress(self._chunkraw(rev, rev))
997 return decompress(self._chunkraw(rev, rev))
998
998
999 def _chunkclear(self):
999 def _chunkclear(self):
1000 self._chunkcache = (0, '')
1000 self._chunkcache = (0, '')
1001
1001
1002 def revdiff(self, rev1, rev2):
1002 def revdiff(self, rev1, rev2):
1003 """return or calculate a delta between two revisions"""
1003 """return or calculate a delta between two revisions"""
1004 if rev1 + 1 == rev2 and self.base(rev1) == self.base(rev2):
1004 if rev1 + 1 == rev2 and self.base(rev1) == self.base(rev2):
1005 return self._chunk(rev2)
1005 return self._chunk(rev2)
1006
1006
1007 return mdiff.textdiff(self.revision(self.node(rev1)),
1007 return mdiff.textdiff(self.revision(self.node(rev1)),
1008 self.revision(self.node(rev2)))
1008 self.revision(self.node(rev2)))
1009
1009
1010 def revision(self, node):
1010 def revision(self, node):
1011 """return an uncompressed revision of a given node"""
1011 """return an uncompressed revision of a given node"""
1012 if node == nullid:
1012 if node == nullid:
1013 return ""
1013 return ""
1014 if self._cache and self._cache[0] == node:
1014 if self._cache and self._cache[0] == node:
1015 return self._cache[2]
1015 return self._cache[2]
1016
1016
1017 # look up what we need to read
1017 # look up what we need to read
1018 text = None
1018 text = None
1019 rev = self.rev(node)
1019 rev = self.rev(node)
1020 base = self.base(rev)
1020 base = self.base(rev)
1021
1021
1022 # check rev flags
1022 # check rev flags
1023 if self.index[rev][0] & 0xFFFF:
1023 if self.index[rev][0] & 0xFFFF:
1024 raise RevlogError(_('incompatible revision flag %x') %
1024 raise RevlogError(_('incompatible revision flag %x') %
1025 (self.index[rev][0] & 0xFFFF))
1025 (self.index[rev][0] & 0xFFFF))
1026
1026
1027 # do we have useful data cached?
1027 # do we have useful data cached?
1028 if self._cache and self._cache[1] >= base and self._cache[1] < rev:
1028 if self._cache and self._cache[1] >= base and self._cache[1] < rev:
1029 base = self._cache[1]
1029 base = self._cache[1]
1030 text = self._cache[2]
1030 text = self._cache[2]
1031
1031
1032 self._loadindex(base, rev + 1)
1032 self._loadindex(base, rev + 1)
1033 self._chunkraw(base, rev)
1033 self._chunkraw(base, rev)
1034 if text is None:
1034 if text is None:
1035 text = self._chunk(base)
1035 text = self._chunk(base)
1036
1036
1037 bins = [self._chunk(r) for r in xrange(base + 1, rev + 1)]
1037 bins = [self._chunk(r) for r in xrange(base + 1, rev + 1)]
1038 text = mdiff.patches(text, bins)
1038 text = mdiff.patches(text, bins)
1039 p1, p2 = self.parents(node)
1039 p1, p2 = self.parents(node)
1040 if node != hash(text, p1, p2):
1040 if node != hash(text, p1, p2):
1041 raise RevlogError(_("integrity check failed on %s:%d")
1041 raise RevlogError(_("integrity check failed on %s:%d")
1042 % (self.indexfile, rev))
1042 % (self.indexfile, rev))
1043
1043
1044 self._cache = (node, rev, text)
1044 self._cache = (node, rev, text)
1045 return text
1045 return text
1046
1046
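# The reconstruction above boils down to this sketch (flags, caching
# and index preloading omitted):
#
#   base = self.base(rev)
#   text = self._chunk(base)                      # full snapshot
#   bins = [self._chunk(r) for r in xrange(base + 1, rev + 1)]
#   text = mdiff.patches(text, bins)              # apply delta chain
#   p1, p2 = self.parents(node)
#   assert hash(text, p1, p2) == node             # integrity check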
1047 def checkinlinesize(self, tr, fp=None):
1047 def checkinlinesize(self, tr, fp=None):
1048 if not self._inline or (self.start(-2) + self.length(-2)) < _maxinline:
1048 if not self._inline or (self.start(-2) + self.length(-2)) < _maxinline:
1049 return
1049 return
1050
1050
1051 trinfo = tr.find(self.indexfile)
1051 trinfo = tr.find(self.indexfile)
1052 if trinfo is None:
1052 if trinfo is None:
1053 raise RevlogError(_("%s not found in the transaction")
1053 raise RevlogError(_("%s not found in the transaction")
1054 % self.indexfile)
1054 % self.indexfile)
1055
1055
1056 trindex = trinfo[2]
1056 trindex = trinfo[2]
1057 dataoff = self.start(trindex)
1057 dataoff = self.start(trindex)
1058
1058
1059 tr.add(self.datafile, dataoff)
1059 tr.add(self.datafile, dataoff)
1060
1060
1061 if fp:
1061 if fp:
1062 fp.flush()
1062 fp.flush()
1063 fp.close()
1063 fp.close()
1064
1064
1065 df = self.opener(self.datafile, 'w')
1065 df = self.opener(self.datafile, 'w')
1066 try:
1066 try:
1067 for r in self:
1067 for r in self:
1068 df.write(self._chunkraw(r, r))
1068 df.write(self._chunkraw(r, r))
1069 finally:
1069 finally:
1070 df.close()
1070 df.close()
1071
1071
1072 fp = self.opener(self.indexfile, 'w', atomictemp=True)
1072 fp = self.opener(self.indexfile, 'w', atomictemp=True)
1073 self.version &= ~(REVLOGNGINLINEDATA)
1073 self.version &= ~(REVLOGNGINLINEDATA)
1074 self._inline = False
1074 self._inline = False
1075 for i in self:
1075 for i in self:
1076 e = self._io.packentry(self.index[i], self.node, self.version, i)
1076 e = self._io.packentry(self.index[i], self.node, self.version, i)
1077 fp.write(e)
1077 fp.write(e)
1078
1078
1079 # if we don't call rename, the temp file will never replace the
1079 # if we don't call rename, the temp file will never replace the
1080 # real index
1080 # real index
1081 fp.rename()
1081 fp.rename()
1082
1082
1083 tr.replace(self.indexfile, trindex * self._io.size)
1083 tr.replace(self.indexfile, trindex * self._io.size)
1084 self._chunkclear()
1084 self._chunkclear()
1085
1085
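# The early return above keeps the revlog inline until its data reaches
# _maxinline (128 KiB). The index ends with a trailing null sentinel
# entry (see the insert(-1, ...) calls below), so index -2 is the last
# real revision; past the threshold, the data is copied out to a
# separate .d file and the index is rewritten without the
# REVLOGNGINLINEDATA flag.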
1086 def addrevision(self, text, transaction, link, p1, p2, d=None):
1086 def addrevision(self, text, transaction, link, p1, p2, d=None):
1087 """add a revision to the log
1087 """add a revision to the log
1088
1088
1089 text - the revision data to add
1089 text - the revision data to add
1090 transaction - the transaction object used for rollback
1090 transaction - the transaction object used for rollback
1091 link - the linkrev data to add
1091 link - the linkrev data to add
1092 p1, p2 - the parent nodeids of the revision
1092 p1, p2 - the parent nodeids of the revision
1093 d - an optional precomputed delta
1093 d - an optional precomputed delta
1094 """
1094 """
1095 dfh = None
1095 dfh = None
1096 if not self._inline:
1096 if not self._inline:
1097 dfh = self.opener(self.datafile, "a")
1097 dfh = self.opener(self.datafile, "a")
1098 ifh = self.opener(self.indexfile, "a+")
1098 ifh = self.opener(self.indexfile, "a+")
1099 try:
1099 try:
1100 return self._addrevision(text, transaction, link, p1, p2, d, ifh, dfh)
1100 return self._addrevision(text, transaction, link, p1, p2, d, ifh, dfh)
1101 finally:
1101 finally:
1102 if dfh:
1102 if dfh:
1103 dfh.close()
1103 dfh.close()
1104 ifh.close()
1104 ifh.close()
1105
1105
1106 def _addrevision(self, text, transaction, link, p1, p2, d, ifh, dfh):
1106 def _addrevision(self, text, transaction, link, p1, p2, d, ifh, dfh):
1107 node = hash(text, p1, p2)
1107 node = hash(text, p1, p2)
1108 if node in self.nodemap:
1108 if node in self.nodemap:
1109 return node
1109 return node
1110
1110
1111 curr = len(self)
1111 curr = len(self)
1112 prev = curr - 1
1112 prev = curr - 1
1113 base = self.base(prev)
1113 base = self.base(prev)
1114 offset = self.end(prev)
1114 offset = self.end(prev)
1115
1115
1116 if curr:
1116 if curr:
1117 if not d:
1117 if not d:
1118 ptext = self.revision(self.node(prev))
1118 ptext = self.revision(self.node(prev))
1119 d = mdiff.textdiff(ptext, text)
1119 d = mdiff.textdiff(ptext, text)
1120 data = compress(d)
1120 data = compress(d)
1121 l = len(data[1]) + len(data[0])
1121 l = len(data[1]) + len(data[0])
1122 dist = l + offset - self.start(base)
1122 dist = l + offset - self.start(base)
1123
1123
1124 # full versions are inserted when the needed deltas
1124 # full versions are inserted when the needed deltas
1125 # become comparable to the uncompressed text
1125 # become comparable to the uncompressed text
1126 if not curr or dist > len(text) * 2:
1126 if not curr or dist > len(text) * 2:
1127 data = compress(text)
1127 data = compress(text)
1128 l = len(data[1]) + len(data[0])
1128 l = len(data[1]) + len(data[0])
1129 base = curr
1129 base = curr
1130
1130
1131 e = (offset_type(offset, 0), l, len(text),
1131 e = (offset_type(offset, 0), l, len(text),
1132 base, link, self.rev(p1), self.rev(p2), node)
1132 base, link, self.rev(p1), self.rev(p2), node)
1133 self.index.insert(-1, e)
1133 self.index.insert(-1, e)
1134 self.nodemap[node] = curr
1134 self.nodemap[node] = curr
1135
1135
1136 entry = self._io.packentry(e, self.node, self.version, curr)
1136 entry = self._io.packentry(e, self.node, self.version, curr)
1137 if not self._inline:
1137 if not self._inline:
1138 transaction.add(self.datafile, offset)
1138 transaction.add(self.datafile, offset)
1139 transaction.add(self.indexfile, curr * len(entry))
1139 transaction.add(self.indexfile, curr * len(entry))
1140 if data[0]:
1140 if data[0]:
1141 dfh.write(data[0])
1141 dfh.write(data[0])
1142 dfh.write(data[1])
1142 dfh.write(data[1])
1143 dfh.flush()
1143 dfh.flush()
1144 ifh.write(entry)
1144 ifh.write(entry)
1145 else:
1145 else:
1146 offset += curr * self._io.size
1146 offset += curr * self._io.size
1147 transaction.add(self.indexfile, offset, curr)
1147 transaction.add(self.indexfile, offset, curr)
1148 ifh.write(entry)
1148 ifh.write(entry)
1149 ifh.write(data[0])
1149 ifh.write(data[0])
1150 ifh.write(data[1])
1150 ifh.write(data[1])
1151 self.checkinlinesize(transaction, ifh)
1151 self.checkinlinesize(transaction, ifh)
1152
1152
1153 if type(text) == str: # only accept immutable objects
1153 if type(text) == str: # only accept immutable objects
1154 self._cache = (node, curr, text)
1154 self._cache = (node, curr, text)
1155 return node
1155 return node
1156
1156
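# Worked example of the snapshot heuristic above. Suppose the new full
# text is 10,000 bytes and the stored data since the last full version
# (base) already spans 15,000 bytes; if the new compressed delta adds
# 6,000 bytes, dist = 21,000 > 2 * 10,000, so a compressed full
# snapshot is written instead and base moves to curr.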
1157 def group(self, nodelist, lookup, infocollect=None):
1157 def group(self, nodelist, lookup, infocollect=None):
1158 """Calculate a delta group, yielding a sequence of changegroup chunks
1158 """Calculate a delta group, yielding a sequence of changegroup chunks
1159 (strings).
1159 (strings).
1160
1160
1161 Given a list of changeset revs, return a set of deltas and
1161 Given a list of changeset revs, return a set of deltas and
1162 metadata corresponding to nodes. The first delta is
1162 metadata corresponding to nodes. The first delta is
1163 parent(nodes[0]) -> nodes[0]; the receiver is guaranteed to
1163 parent(nodes[0]) -> nodes[0]; the receiver is guaranteed to
1164 have this parent, as it has all history before these
1164 have this parent, as it has all history before these
1165 changesets. The parent used is the first parent (parents[0]).
1165 changesets. The parent used is the first parent (parents[0]).
1166 """
1166 """
1167
1167
1168 revs = [self.rev(n) for n in nodelist]
1168 revs = [self.rev(n) for n in nodelist]
1169
1169
1170 # if we don't have any revisions touched by these changesets, bail
1170 # if we don't have any revisions touched by these changesets, bail
1171 if not revs:
1171 if not revs:
1172 yield changegroup.closechunk()
1172 yield changegroup.closechunk()
1173 return
1173 return
1174
1174
1175 # add the parent of the first rev
1175 # add the parent of the first rev
1176 p = self.parentrevs(revs[0])[0]
1176 p = self.parentrevs(revs[0])[0]
1177 revs.insert(0, p)
1177 revs.insert(0, p)
1178
1178
1179 # build deltas
1179 # build deltas
1180 for d in xrange(len(revs) - 1):
1180 for d in xrange(len(revs) - 1):
1181 a, b = revs[d], revs[d + 1]
1181 a, b = revs[d], revs[d + 1]
1182 nb = self.node(b)
1182 nb = self.node(b)
1183
1183
1184 if infocollect is not None:
1184 if infocollect is not None:
1185 infocollect(nb)
1185 infocollect(nb)
1186
1186
1187 p = self.parents(nb)
1187 p = self.parents(nb)
1188 meta = nb + p[0] + p[1] + lookup(nb)
1188 meta = nb + p[0] + p[1] + lookup(nb)
1189 if a == -1:
1189 if a == -1:
1190 d = self.revision(nb)
1190 d = self.revision(nb)
1191 meta += mdiff.trivialdiffheader(len(d))
1191 meta += mdiff.trivialdiffheader(len(d))
1192 else:
1192 else:
1193 d = self.revdiff(a, b)
1193 d = self.revdiff(a, b)
1194 yield changegroup.chunkheader(len(meta) + len(d))
1194 yield changegroup.chunkheader(len(meta) + len(d))
1195 yield meta
1195 yield meta
1196 if len(d) > 2**20:
1196 yield d
1197 pos = 0
1198 while pos < len(d):
1199 pos2 = pos + 2 ** 18
1200 yield d[pos:pos2]
1201 pos = pos2
1202 else:
1203 yield d
1204
1197
1205 yield changegroup.closechunk()
1198 yield changegroup.closechunk()
1206
1199
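# The splitting removed above (slicing any delta larger than 2**20
# bytes into 2**18-byte pieces before yielding) now happens on the
# reading side; per the commit message, chunkbuffer splits big strings
# directly. A sketch of the dropped producer-side logic:
#
#   if len(d) > 2 ** 20:
#       for pos in xrange(0, len(d), 2 ** 18):
#           yield d[pos:pos + 2 ** 18]
#   else:
#       yield d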
1207 def addgroup(self, revs, linkmapper, transaction):
1200 def addgroup(self, revs, linkmapper, transaction):
1208 """
1201 """
1209 add a delta group
1202 add a delta group
1210
1203
1211 given a set of deltas, add them to the revision log. the
1204 given a set of deltas, add them to the revision log. the
1212 first delta is against its parent, which should be in our
1205 first delta is against its parent, which should be in our
1213 log, the rest are against the previous delta.
1206 log, the rest are against the previous delta.
1214 """
1207 """
1215
1208
1216 # track the base of the current delta log
1209 # track the base of the current delta log
1217 r = len(self)
1210 r = len(self)
1218 t = r - 1
1211 t = r - 1
1219 node = None
1212 node = None
1220
1213
1221 base = prev = nullrev
1214 base = prev = nullrev
1222 start = end = textlen = 0
1215 start = end = textlen = 0
1223 if r:
1216 if r:
1224 end = self.end(t)
1217 end = self.end(t)
1225
1218
1226 ifh = self.opener(self.indexfile, "a+")
1219 ifh = self.opener(self.indexfile, "a+")
1227 isize = r * self._io.size
1220 isize = r * self._io.size
1228 if self._inline:
1221 if self._inline:
1229 transaction.add(self.indexfile, end + isize, r)
1222 transaction.add(self.indexfile, end + isize, r)
1230 dfh = None
1223 dfh = None
1231 else:
1224 else:
1232 transaction.add(self.indexfile, isize, r)
1225 transaction.add(self.indexfile, isize, r)
1233 transaction.add(self.datafile, end)
1226 transaction.add(self.datafile, end)
1234 dfh = self.opener(self.datafile, "a")
1227 dfh = self.opener(self.datafile, "a")
1235
1228
1236 try:
1229 try:
1237 # loop through our set of deltas
1230 # loop through our set of deltas
1238 chain = None
1231 chain = None
1239 for chunk in revs:
1232 for chunk in revs:
1240 node, p1, p2, cs = struct.unpack("20s20s20s20s", chunk[:80])
1233 node, p1, p2, cs = struct.unpack("20s20s20s20s", chunk[:80])
1241 link = linkmapper(cs)
1234 link = linkmapper(cs)
1242 if node in self.nodemap:
1235 if node in self.nodemap:
1243 # this can happen if two branches make the same change
1236 # this can happen if two branches make the same change
1244 chain = node
1237 chain = node
1245 continue
1238 continue
1246 delta = buffer(chunk, 80)
1239 delta = buffer(chunk, 80)
1247 del chunk
1240 del chunk
1248
1241
1249 for p in (p1, p2):
1242 for p in (p1, p2):
1250 if not p in self.nodemap:
1243 if not p in self.nodemap:
1251 raise LookupError(p, self.indexfile, _('unknown parent'))
1244 raise LookupError(p, self.indexfile, _('unknown parent'))
1252
1245
1253 if not chain:
1246 if not chain:
1254 # retrieve the parent revision of the delta chain
1247 # retrieve the parent revision of the delta chain
1255 chain = p1
1248 chain = p1
1256 if not chain in self.nodemap:
1249 if not chain in self.nodemap:
1257 raise LookupError(chain, self.indexfile, _('unknown base'))
1250 raise LookupError(chain, self.indexfile, _('unknown base'))
1258
1251
1259 # full versions are inserted when the needed deltas become
1252 # full versions are inserted when the needed deltas become
1260 # comparable to the uncompressed text or when the previous
1253 # comparable to the uncompressed text or when the previous
1261 # version is not the one we have a delta against. We use
1254 # version is not the one we have a delta against. We use
1262 # the size of the previous full rev as a proxy for the
1255 # the size of the previous full rev as a proxy for the
1263 # current size.
1256 # current size.
1264
1257
1265 if chain == prev:
1258 if chain == prev:
1266 cdelta = compress(delta)
1259 cdelta = compress(delta)
1267 cdeltalen = len(cdelta[0]) + len(cdelta[1])
1260 cdeltalen = len(cdelta[0]) + len(cdelta[1])
1268 textlen = mdiff.patchedsize(textlen, delta)
1261 textlen = mdiff.patchedsize(textlen, delta)
1269
1262
1270 if chain != prev or (end - start + cdeltalen) > textlen * 2:
1263 if chain != prev or (end - start + cdeltalen) > textlen * 2:
1271 # flush our writes here so revision() can read them back
1264 # flush our writes here so revision() can read them back
1272 if dfh:
1265 if dfh:
1273 dfh.flush()
1266 dfh.flush()
1274 ifh.flush()
1267 ifh.flush()
1275 text = self.revision(chain)
1268 text = self.revision(chain)
1276 if len(text) == 0:
1269 if len(text) == 0:
1277 # skip over trivial delta header
1270 # skip over trivial delta header
1278 text = buffer(delta, 12)
1271 text = buffer(delta, 12)
1279 else:
1272 else:
1280 text = mdiff.patches(text, [delta])
1273 text = mdiff.patches(text, [delta])
1281 del delta
1274 del delta
1282 chk = self._addrevision(text, transaction, link, p1, p2, None,
1275 chk = self._addrevision(text, transaction, link, p1, p2, None,
1283 ifh, dfh)
1276 ifh, dfh)
1284 if not dfh and not self._inline:
1277 if not dfh and not self._inline:
1285 # addrevision switched from inline to conventional
1278 # addrevision switched from inline to conventional
1286 # reopen the index
1279 # reopen the index
1287 dfh = self.opener(self.datafile, "a")
1280 dfh = self.opener(self.datafile, "a")
1288 ifh = self.opener(self.indexfile, "a")
1281 ifh = self.opener(self.indexfile, "a")
1289 if chk != node:
1282 if chk != node:
1290 raise RevlogError(_("consistency error adding group"))
1283 raise RevlogError(_("consistency error adding group"))
1291 textlen = len(text)
1284 textlen = len(text)
1292 else:
1285 else:
1293 e = (offset_type(end, 0), cdeltalen, textlen, base,
1286 e = (offset_type(end, 0), cdeltalen, textlen, base,
1294 link, self.rev(p1), self.rev(p2), node)
1287 link, self.rev(p1), self.rev(p2), node)
1295 self.index.insert(-1, e)
1288 self.index.insert(-1, e)
1296 self.nodemap[node] = r
1289 self.nodemap[node] = r
1297 entry = self._io.packentry(e, self.node, self.version, r)
1290 entry = self._io.packentry(e, self.node, self.version, r)
1298 if self._inline:
1291 if self._inline:
1299 ifh.write(entry)
1292 ifh.write(entry)
1300 ifh.write(cdelta[0])
1293 ifh.write(cdelta[0])
1301 ifh.write(cdelta[1])
1294 ifh.write(cdelta[1])
1302 self.checkinlinesize(transaction, ifh)
1295 self.checkinlinesize(transaction, ifh)
1303 if not self._inline:
1296 if not self._inline:
1304 dfh = self.opener(self.datafile, "a")
1297 dfh = self.opener(self.datafile, "a")
1305 ifh = self.opener(self.indexfile, "a")
1298 ifh = self.opener(self.indexfile, "a")
1306 else:
1299 else:
1307 dfh.write(cdelta[0])
1300 dfh.write(cdelta[0])
1308 dfh.write(cdelta[1])
1301 dfh.write(cdelta[1])
1309 ifh.write(entry)
1302 ifh.write(entry)
1310
1303
1311 t, r, chain, prev = r, r + 1, node, node
1304 t, r, chain, prev = r, r + 1, node, node
1312 base = self.base(t)
1305 base = self.base(t)
1313 start = self.start(base)
1306 start = self.start(base)
1314 end = self.end(t)
1307 end = self.end(t)
1315 finally:
1308 finally:
1316 if dfh:
1309 if dfh:
1317 dfh.close()
1310 dfh.close()
1318 ifh.close()
1311 ifh.close()
1319
1312
1320 return node
1313 return node
1321
1314
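# Layout of the chunks addgroup() consumes, as unpacked above; each
# chunk is an 80-byte header of four 20-byte binary nodes followed by
# the delta payload:
#
#   | node (20) | p1 (20) | p2 (20) | cs (20) | delta ... |
#
# cs is the changeset node, mapped through linkmapper() to a linkrev;
# the first delta applies against its parent p1, later ones against
# the previous chunk's node.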
1322 def strip(self, minlink, transaction):
1315 def strip(self, minlink, transaction):
1323 """truncate the revlog on the first revision with a linkrev >= minlink
1316 """truncate the revlog on the first revision with a linkrev >= minlink
1324
1317
1325 This function is called when we're stripping revision minlink and
1318 This function is called when we're stripping revision minlink and
1326 its descendants from the repository.
1319 its descendants from the repository.
1327
1320
1328 We have to remove all revisions with linkrev >= minlink, because
1321 We have to remove all revisions with linkrev >= minlink, because
1329 the equivalent changelog revisions will be renumbered after the
1322 the equivalent changelog revisions will be renumbered after the
1330 strip.
1323 strip.
1331
1324
1332 So we truncate the revlog on the first of these revisions, and
1325 So we truncate the revlog on the first of these revisions, and
1333 trust that the caller has saved the revisions that shouldn't be
1326 trust that the caller has saved the revisions that shouldn't be
1334 removed and that it'll re-add them after this truncation.
1327 removed and that it'll re-add them after this truncation.
1335 """
1328 """
1336 if len(self) == 0:
1329 if len(self) == 0:
1337 return
1330 return
1338
1331
1339 if isinstance(self.index, lazyindex):
1332 if isinstance(self.index, lazyindex):
1340 self._loadindexmap()
1333 self._loadindexmap()
1341
1334
1342 for rev in self:
1335 for rev in self:
1343 if self.index[rev][4] >= minlink:
1336 if self.index[rev][4] >= minlink:
1344 break
1337 break
1345 else:
1338 else:
1346 return
1339 return
1347
1340
1348 # first truncate the files on disk
1341 # first truncate the files on disk
1349 end = self.start(rev)
1342 end = self.start(rev)
1350 if not self._inline:
1343 if not self._inline:
1351 transaction.add(self.datafile, end)
1344 transaction.add(self.datafile, end)
1352 end = rev * self._io.size
1345 end = rev * self._io.size
1353 else:
1346 else:
1354 end += rev * self._io.size
1347 end += rev * self._io.size
1355
1348
1356 transaction.add(self.indexfile, end)
1349 transaction.add(self.indexfile, end)
1357
1350
1358 # then reset internal state in memory to forget those revisions
1351 # then reset internal state in memory to forget those revisions
1359 self._cache = None
1352 self._cache = None
1360 self._chunkclear()
1353 self._chunkclear()
1361 for x in xrange(rev, len(self)):
1354 for x in xrange(rev, len(self)):
1362 del self.nodemap[self.node(x)]
1355 del self.nodemap[self.node(x)]
1363
1356
1364 del self.index[rev:-1]
1357 del self.index[rev:-1]
1365
1358
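# Truncation arithmetic for strip() above. With a separate .d file, the
# data file is cut at self.start(rev) and the index at
# rev * self._io.size (rev fixed-size entries). Inline, entries and
# data share one file, so the cut point is the data offset plus
# rev * self._io.size bytes of index entries.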
1366 def checksize(self):
1359 def checksize(self):
1367 expected = 0
1360 expected = 0
1368 if len(self):
1361 if len(self):
1369 expected = max(0, self.end(len(self) - 1))
1362 expected = max(0, self.end(len(self) - 1))
1370
1363
1371 try:
1364 try:
1372 f = self.opener(self.datafile)
1365 f = self.opener(self.datafile)
1373 f.seek(0, 2)
1366 f.seek(0, 2)
1374 actual = f.tell()
1367 actual = f.tell()
1375 dd = actual - expected
1368 dd = actual - expected
1376 except IOError, inst:
1369 except IOError, inst:
1377 if inst.errno != errno.ENOENT:
1370 if inst.errno != errno.ENOENT:
1378 raise
1371 raise
1379 dd = 0
1372 dd = 0
1380
1373
1381 try:
1374 try:
1382 f = self.opener(self.indexfile)
1375 f = self.opener(self.indexfile)
1383 f.seek(0, 2)
1376 f.seek(0, 2)
1384 actual = f.tell()
1377 actual = f.tell()
1385 s = self._io.size
1378 s = self._io.size
1386 i = max(0, actual // s)
1379 i = max(0, actual // s)
1387 di = actual - (i * s)
1380 di = actual - (i * s)
1388 if self._inline:
1381 if self._inline:
1389 databytes = 0
1382 databytes = 0
1390 for r in self:
1383 for r in self:
1391 databytes += max(0, self.length(r))
1384 databytes += max(0, self.length(r))
1392 dd = 0
1385 dd = 0
1393 di = actual - len(self) * s - databytes
1386 di = actual - len(self) * s - databytes
1394 except IOError, inst:
1387 except IOError, inst:
1395 if inst.errno != errno.ENOENT:
1388 if inst.errno != errno.ENOENT:
1396 raise
1389 raise
1397 di = 0
1390 di = 0
1398
1391
1399 return (dd, di)
1392 return (dd, di)
1400
1393
1401 def files(self):
1394 def files(self):
1402 res = [self.indexfile]
1395 res = [self.indexfile]
1403 if not self._inline:
1396 if not self._inline:
1404 res.append(self.datafile)
1397 res.append(self.datafile)
1405 return res
1398 return res
@@ -1,1394 +1,1404 b''
1 # util.py - Mercurial utility functions and platform specific implementations
1 # util.py - Mercurial utility functions and platform specific implementations
2 #
2 #
3 # Copyright 2005 K. Thananchayan <thananck@yahoo.com>
3 # Copyright 2005 K. Thananchayan <thananck@yahoo.com>
4 # Copyright 2005-2007 Matt Mackall <mpm@selenic.com>
4 # Copyright 2005-2007 Matt Mackall <mpm@selenic.com>
5 # Copyright 2006 Vadim Gelfer <vadim.gelfer@gmail.com>
5 # Copyright 2006 Vadim Gelfer <vadim.gelfer@gmail.com>
6 #
6 #
7 # This software may be used and distributed according to the terms of the
7 # This software may be used and distributed according to the terms of the
8 # GNU General Public License version 2 or any later version.
8 # GNU General Public License version 2 or any later version.
9
9
10 """Mercurial utility functions and platform specfic implementations.
10 """Mercurial utility functions and platform specfic implementations.
11
11
12 This contains helper routines that are independent of the SCM core and
12 This contains helper routines that are independent of the SCM core and
13 hide platform-specific details from the core.
13 hide platform-specific details from the core.
14 """
14 """
15
15
16 from i18n import _
16 from i18n import _
17 import error, osutil, encoding
17 import error, osutil, encoding
18 import errno, re, shutil, sys, tempfile, traceback
18 import errno, re, shutil, sys, tempfile, traceback
19 import os, stat, time, calendar, textwrap, unicodedata, signal
19 import os, stat, time, calendar, textwrap, unicodedata, signal
20 import imp
20 import imp
21
21
22 # Python compatibility
22 # Python compatibility
23
23
24 def sha1(s):
24 def sha1(s):
25 return _fastsha1(s)
25 return _fastsha1(s)
26
26
27 def _fastsha1(s):
27 def _fastsha1(s):
28 # This function will import sha1 from hashlib or sha (whichever is
28 # This function will import sha1 from hashlib or sha (whichever is
29 # available) and overwrite itself with it on the first call.
29 # available) and overwrite itself with it on the first call.
30 # Subsequent calls will go directly to the imported function.
30 # Subsequent calls will go directly to the imported function.
31 try:
31 try:
32 from hashlib import sha1 as _sha1
32 from hashlib import sha1 as _sha1
33 except ImportError:
33 except ImportError:
34 from sha import sha as _sha1
34 from sha import sha as _sha1
35 global _fastsha1, sha1
35 global _fastsha1, sha1
36 _fastsha1 = sha1 = _sha1
36 _fastsha1 = sha1 = _sha1
37 return _sha1(s)
37 return _sha1(s)
38
38
39 import __builtin__
39 import __builtin__
40
40
41 if sys.version_info[0] < 3:
41 if sys.version_info[0] < 3:
42 def fakebuffer(sliceable, offset=0):
42 def fakebuffer(sliceable, offset=0):
43 return sliceable[offset:]
43 return sliceable[offset:]
44 else:
44 else:
45 def fakebuffer(sliceable, offset=0):
45 def fakebuffer(sliceable, offset=0):
46 return memoryview(sliceable)[offset:]
46 return memoryview(sliceable)[offset:]
47 try:
47 try:
48 buffer
48 buffer
49 except NameError:
49 except NameError:
50 __builtin__.buffer = fakebuffer
50 __builtin__.buffer = fakebuffer
51
51
52 import subprocess
52 import subprocess
53 closefds = os.name == 'posix'
53 closefds = os.name == 'posix'
54
54
55 def popen2(cmd, env=None, newlines=False):
55 def popen2(cmd, env=None, newlines=False):
56 # Setting bufsize to -1 lets the system decide the buffer size.
56 # Setting bufsize to -1 lets the system decide the buffer size.
57 # The default for bufsize is 0, meaning unbuffered. This leads to
57 # The default for bufsize is 0, meaning unbuffered. This leads to
58 # poor performance on Mac OS X: http://bugs.python.org/issue4194
58 # poor performance on Mac OS X: http://bugs.python.org/issue4194
59 p = subprocess.Popen(cmd, shell=True, bufsize=-1,
59 p = subprocess.Popen(cmd, shell=True, bufsize=-1,
60 close_fds=closefds,
60 close_fds=closefds,
61 stdin=subprocess.PIPE, stdout=subprocess.PIPE,
61 stdin=subprocess.PIPE, stdout=subprocess.PIPE,
62 universal_newlines=newlines,
62 universal_newlines=newlines,
63 env=env)
63 env=env)
64 return p.stdin, p.stdout
64 return p.stdin, p.stdout
65
65
66 def popen3(cmd, env=None, newlines=False):
66 def popen3(cmd, env=None, newlines=False):
67 p = subprocess.Popen(cmd, shell=True, bufsize=-1,
67 p = subprocess.Popen(cmd, shell=True, bufsize=-1,
68 close_fds=closefds,
68 close_fds=closefds,
69 stdin=subprocess.PIPE, stdout=subprocess.PIPE,
69 stdin=subprocess.PIPE, stdout=subprocess.PIPE,
70 stderr=subprocess.PIPE,
70 stderr=subprocess.PIPE,
71 universal_newlines=newlines,
71 universal_newlines=newlines,
72 env=env)
72 env=env)
73 return p.stdin, p.stdout, p.stderr
73 return p.stdin, p.stdout, p.stderr
74
74
75 def version():
75 def version():
76 """Return version information if available."""
76 """Return version information if available."""
77 try:
77 try:
78 import __version__
78 import __version__
79 return __version__.version
79 return __version__.version
80 except ImportError:
80 except ImportError:
81 return 'unknown'
81 return 'unknown'
82
82
83 # used by parsedate
83 # used by parsedate
84 defaultdateformats = (
84 defaultdateformats = (
85 '%Y-%m-%d %H:%M:%S',
85 '%Y-%m-%d %H:%M:%S',
86 '%Y-%m-%d %I:%M:%S%p',
86 '%Y-%m-%d %I:%M:%S%p',
87 '%Y-%m-%d %H:%M',
87 '%Y-%m-%d %H:%M',
88 '%Y-%m-%d %I:%M%p',
88 '%Y-%m-%d %I:%M%p',
89 '%Y-%m-%d',
89 '%Y-%m-%d',
90 '%m-%d',
90 '%m-%d',
91 '%m/%d',
91 '%m/%d',
92 '%m/%d/%y',
92 '%m/%d/%y',
93 '%m/%d/%Y',
93 '%m/%d/%Y',
94 '%a %b %d %H:%M:%S %Y',
94 '%a %b %d %H:%M:%S %Y',
95 '%a %b %d %I:%M:%S%p %Y',
95 '%a %b %d %I:%M:%S%p %Y',
96 '%a, %d %b %Y %H:%M:%S', # GNU coreutils "/bin/date --rfc-2822"
96 '%a, %d %b %Y %H:%M:%S', # GNU coreutils "/bin/date --rfc-2822"
97 '%b %d %H:%M:%S %Y',
97 '%b %d %H:%M:%S %Y',
98 '%b %d %I:%M:%S%p %Y',
98 '%b %d %I:%M:%S%p %Y',
99 '%b %d %H:%M:%S',
99 '%b %d %H:%M:%S',
100 '%b %d %I:%M:%S%p',
100 '%b %d %I:%M:%S%p',
101 '%b %d %H:%M',
101 '%b %d %H:%M',
102 '%b %d %I:%M%p',
102 '%b %d %I:%M%p',
103 '%b %d %Y',
103 '%b %d %Y',
104 '%b %d',
104 '%b %d',
105 '%H:%M:%S',
105 '%H:%M:%S',
106 '%I:%M:%S%p',
106 '%I:%M:%S%p',
107 '%H:%M',
107 '%H:%M',
108 '%I:%M%p',
108 '%I:%M%p',
109 )
109 )
110
110
111 extendeddateformats = defaultdateformats + (
111 extendeddateformats = defaultdateformats + (
112 "%Y",
112 "%Y",
113 "%Y-%m",
113 "%Y-%m",
114 "%b",
114 "%b",
115 "%b %Y",
115 "%b %Y",
116 )
116 )
117
117
118 def cachefunc(func):
118 def cachefunc(func):
119 '''cache the result of function calls'''
119 '''cache the result of function calls'''
120 # XXX doesn't handle keyword args
120 # XXX doesn't handle keyword args
121 cache = {}
121 cache = {}
122 if func.func_code.co_argcount == 1:
122 if func.func_code.co_argcount == 1:
123 # we gain a small amount of time because
123 # we gain a small amount of time because
124 # we don't need to pack/unpack the list
124 # we don't need to pack/unpack the list
125 def f(arg):
125 def f(arg):
126 if arg not in cache:
126 if arg not in cache:
127 cache[arg] = func(arg)
127 cache[arg] = func(arg)
128 return cache[arg]
128 return cache[arg]
129 else:
129 else:
130 def f(*args):
130 def f(*args):
131 if args not in cache:
131 if args not in cache:
132 cache[args] = func(*args)
132 cache[args] = func(*args)
133 return cache[args]
133 return cache[args]
134
134
135 return f
135 return f
136
136
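# Minimal usage sketch for cachefunc() (hypothetical function).
# Results are cached forever, and keyword arguments are not supported,
# as the XXX above notes:
#
#   def _parse(rev):
#       return expensive_parse(rev)   # hypothetical slow call
#   parse = cachefunc(_parse)
#   parse(3)    # computed
#   parse(3)    # served from the cache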
137 def lrucachefunc(func):
137 def lrucachefunc(func):
138 '''cache most recent results of function calls'''
138 '''cache most recent results of function calls'''
139 cache = {}
139 cache = {}
140 order = []
140 order = []
141 if func.func_code.co_argcount == 1:
141 if func.func_code.co_argcount == 1:
142 def f(arg):
142 def f(arg):
143 if arg not in cache:
143 if arg not in cache:
144 if len(cache) > 20:
144 if len(cache) > 20:
145 del cache[order.pop(0)]
145 del cache[order.pop(0)]
146 cache[arg] = func(arg)
146 cache[arg] = func(arg)
147 else:
147 else:
148 order.remove(arg)
148 order.remove(arg)
149 order.append(arg)
149 order.append(arg)
150 return cache[arg]
150 return cache[arg]
151 else:
151 else:
152 def f(*args):
152 def f(*args):
153 if args not in cache:
153 if args not in cache:
154 if len(cache) > 20:
154 if len(cache) > 20:
155 del cache[order.pop(0)]
155 del cache[order.pop(0)]
156 cache[args] = func(*args)
156 cache[args] = func(*args)
157 else:
157 else:
158 order.remove(args)
158 order.remove(args)
159 order.append(args)
159 order.append(args)
160 return cache[args]
160 return cache[args]
161
161
162 return f
162 return f
163
163
164 class propertycache(object):
164 class propertycache(object):
165 def __init__(self, func):
165 def __init__(self, func):
166 self.func = func
166 self.func = func
167 self.name = func.__name__
167 self.name = func.__name__
168 def __get__(self, obj, type=None):
168 def __get__(self, obj, type=None):
169 result = self.func(obj)
169 result = self.func(obj)
170 setattr(obj, self.name, result)
170 setattr(obj, self.name, result)
171 return result
171 return result
172
172
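# Usage sketch for propertycache. Because __get__ stores the result as
# an instance attribute of the same name, that attribute shadows the
# (non-data) descriptor afterwards, so func runs at most once per
# instance:
#
#   class repo(object):
#       @propertycache
#       def changelog(self):            # hypothetical attribute
#           return expensive_load()     # first access only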
173 def pipefilter(s, cmd):
173 def pipefilter(s, cmd):
174 '''filter string S through command CMD, returning its output'''
174 '''filter string S through command CMD, returning its output'''
175 p = subprocess.Popen(cmd, shell=True, close_fds=closefds,
175 p = subprocess.Popen(cmd, shell=True, close_fds=closefds,
176 stdin=subprocess.PIPE, stdout=subprocess.PIPE)
176 stdin=subprocess.PIPE, stdout=subprocess.PIPE)
177 pout, perr = p.communicate(s)
177 pout, perr = p.communicate(s)
178 return pout
178 return pout
179
179
180 def tempfilter(s, cmd):
180 def tempfilter(s, cmd):
181 '''filter string S through a pair of temporary files with CMD.
181 '''filter string S through a pair of temporary files with CMD.
182 CMD is used as a template to create the real command to be run,
182 CMD is used as a template to create the real command to be run,
183 with the strings INFILE and OUTFILE replaced by the real names of
183 with the strings INFILE and OUTFILE replaced by the real names of
184 the temporary files generated.'''
184 the temporary files generated.'''
185 inname, outname = None, None
185 inname, outname = None, None
186 try:
186 try:
187 infd, inname = tempfile.mkstemp(prefix='hg-filter-in-')
187 infd, inname = tempfile.mkstemp(prefix='hg-filter-in-')
188 fp = os.fdopen(infd, 'wb')
188 fp = os.fdopen(infd, 'wb')
189 fp.write(s)
189 fp.write(s)
190 fp.close()
190 fp.close()
191 outfd, outname = tempfile.mkstemp(prefix='hg-filter-out-')
191 outfd, outname = tempfile.mkstemp(prefix='hg-filter-out-')
192 os.close(outfd)
192 os.close(outfd)
193 cmd = cmd.replace('INFILE', inname)
193 cmd = cmd.replace('INFILE', inname)
194 cmd = cmd.replace('OUTFILE', outname)
194 cmd = cmd.replace('OUTFILE', outname)
195 code = os.system(cmd)
195 code = os.system(cmd)
196 if sys.platform == 'OpenVMS' and code & 1:
196 if sys.platform == 'OpenVMS' and code & 1:
197 code = 0
197 code = 0
198 if code:
198 if code:
199 raise Abort(_("command '%s' failed: %s") %
199 raise Abort(_("command '%s' failed: %s") %
200 (cmd, explain_exit(code)))
200 (cmd, explain_exit(code)))
201 return open(outname, 'rb').read()
201 return open(outname, 'rb').read()
202 finally:
202 finally:
203 try:
203 try:
204 if inname:
204 if inname:
205 os.unlink(inname)
205 os.unlink(inname)
206 except:
206 except:
207 pass
207 pass
208 try:
208 try:
209 if outname:
209 if outname:
210 os.unlink(outname)
210 os.unlink(outname)
211 except:
211 except:
212 pass
212 pass
213
213
214 filtertable = {
214 filtertable = {
215 'tempfile:': tempfilter,
215 'tempfile:': tempfilter,
216 'pipe:': pipefilter,
216 'pipe:': pipefilter,
217 }
217 }
218
218
219 def filter(s, cmd):
219 def filter(s, cmd):
220 "filter a string through a command that transforms its input to its output"
220 "filter a string through a command that transforms its input to its output"
221 for name, fn in filtertable.iteritems():
221 for name, fn in filtertable.iteritems():
222 if cmd.startswith(name):
222 if cmd.startswith(name):
223 return fn(s, cmd[len(name):].lstrip())
223 return fn(s, cmd[len(name):].lstrip())
224 return pipefilter(s, cmd)
224 return pipefilter(s, cmd)
225
225
226 def binary(s):
226 def binary(s):
227 """return true if a string is binary data"""
227 """return true if a string is binary data"""
228 return bool(s and '\0' in s)
228 return bool(s and '\0' in s)
229
229
230 def increasingchunks(source, min=1024, max=65536):
230 def increasingchunks(source, min=1024, max=65536):
231 '''return no less than min bytes per chunk while data remains,
231 '''return no less than min bytes per chunk while data remains,
232 doubling min after each chunk until it reaches max'''
232 doubling min after each chunk until it reaches max'''
233 def log2(x):
233 def log2(x):
234 if not x:
234 if not x:
235 return 0
235 return 0
236 i = 0
236 i = 0
237 while x:
237 while x:
238 x >>= 1
238 x >>= 1
239 i += 1
239 i += 1
240 return i - 1
240 return i - 1
241
241
242 buf = []
242 buf = []
243 blen = 0
243 blen = 0
244 for chunk in source:
244 for chunk in source:
245 buf.append(chunk)
245 buf.append(chunk)
246 blen += len(chunk)
246 blen += len(chunk)
247 if blen >= min:
247 if blen >= min:
248 if min < max:
248 if min < max:
249 min = min << 1
249 min = min << 1
250 nmin = 1 << log2(blen)
250 nmin = 1 << log2(blen)
251 if nmin > min:
251 if nmin > min:
252 min = nmin
252 min = nmin
253 if min > max:
253 if min > max:
254 min = max
254 min = max
255 yield ''.join(buf)
255 yield ''.join(buf)
256 blen = 0
256 blen = 0
257 buf = []
257 buf = []
258 if buf:
258 if buf:
259 yield ''.join(buf)
259 yield ''.join(buf)
260
260
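# Behavior sketch for increasingchunks(). Fed 512-byte pieces, it
# buffers until the current floor is met, doubles the floor (snapping
# it up to the largest power of two <= the emitted size), and caps it
# at max:
#
#   sizes = [len(c) for c in
#            increasingchunks(iter(['x' * 512] * 300))]
#   # -> [1024, 2048, 4096, ..., 65536] plus a final partial chunk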
261 Abort = error.Abort
261 Abort = error.Abort
262
262
263 def always(fn):
263 def always(fn):
264 return True
264 return True
265
265
266 def never(fn):
266 def never(fn):
267 return False
267 return False
268
268
269 def pathto(root, n1, n2):
269 def pathto(root, n1, n2):
270 '''return the relative path from one place to another.
270 '''return the relative path from one place to another.
271 root should use os.sep to separate directories
271 root should use os.sep to separate directories
272 n1 should use os.sep to separate directories
272 n1 should use os.sep to separate directories
273 n2 should use "/" to separate directories
273 n2 should use "/" to separate directories
274 returns an os.sep-separated path.
274 returns an os.sep-separated path.
275
275
276 If n1 is a relative path, it's assumed it's
276 If n1 is a relative path, it's assumed it's
277 relative to root.
277 relative to root.
278 n2 should always be relative to root.
278 n2 should always be relative to root.
279 '''
279 '''
280 if not n1:
280 if not n1:
281 return localpath(n2)
281 return localpath(n2)
282 if os.path.isabs(n1):
282 if os.path.isabs(n1):
283 if os.path.splitdrive(root)[0] != os.path.splitdrive(n1)[0]:
283 if os.path.splitdrive(root)[0] != os.path.splitdrive(n1)[0]:
284 return os.path.join(root, localpath(n2))
284 return os.path.join(root, localpath(n2))
285 n2 = '/'.join((pconvert(root), n2))
285 n2 = '/'.join((pconvert(root), n2))
286 a, b = splitpath(n1), n2.split('/')
286 a, b = splitpath(n1), n2.split('/')
287 a.reverse()
287 a.reverse()
288 b.reverse()
288 b.reverse()
289 while a and b and a[-1] == b[-1]:
289 while a and b and a[-1] == b[-1]:
290 a.pop()
290 a.pop()
291 b.pop()
291 b.pop()
292 b.reverse()
292 b.reverse()
293 return os.sep.join((['..'] * len(a)) + b) or '.'
293 return os.sep.join((['..'] * len(a)) + b) or '.'
294
294
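# Worked example for pathto(). With root='/repo', a relative n1='a/b'
# and n2='c/d', no trailing components are shared, so the result climbs
# out of a/b and descends into c/d:
#
#   pathto('/repo', 'a/b', 'c/d')   # -> '../../c/d' on POSIX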
295 def canonpath(root, cwd, myname):
295 def canonpath(root, cwd, myname):
296 """return the canonical path of myname, given cwd and root"""
296 """return the canonical path of myname, given cwd and root"""
297 if endswithsep(root):
297 if endswithsep(root):
298 rootsep = root
298 rootsep = root
299 else:
299 else:
300 rootsep = root + os.sep
300 rootsep = root + os.sep
301 name = myname
301 name = myname
302 if not os.path.isabs(name):
302 if not os.path.isabs(name):
303 name = os.path.join(root, cwd, name)
303 name = os.path.join(root, cwd, name)
304 name = os.path.normpath(name)
304 name = os.path.normpath(name)
305 audit_path = path_auditor(root)
305 audit_path = path_auditor(root)
306 if name != rootsep and name.startswith(rootsep):
306 if name != rootsep and name.startswith(rootsep):
307 name = name[len(rootsep):]
307 name = name[len(rootsep):]
308 audit_path(name)
308 audit_path(name)
309 return pconvert(name)
309 return pconvert(name)
310 elif name == root:
310 elif name == root:
311 return ''
311 return ''
312 else:
312 else:
313 # Determine whether `name' is in the hierarchy at or beneath `root',
313 # Determine whether `name' is in the hierarchy at or beneath `root',
314 # by iterating name=dirname(name) until that causes no change (can't
314 # by iterating name=dirname(name) until that causes no change (can't
315 # check name == '/', because that doesn't work on windows). For each
315 # check name == '/', because that doesn't work on windows). For each
316 # `name', compare dev/inode numbers. If they match, the list `rel'
316 # `name', compare dev/inode numbers. If they match, the list `rel'
317 # holds the reversed list of components making up the relative file
317 # holds the reversed list of components making up the relative file
318 # name we want.
318 # name we want.
319 root_st = os.stat(root)
319 root_st = os.stat(root)
320 rel = []
320 rel = []
321 while True:
321 while True:
322 try:
322 try:
323 name_st = os.stat(name)
323 name_st = os.stat(name)
324 except OSError:
324 except OSError:
325 break
325 break
326 if samestat(name_st, root_st):
326 if samestat(name_st, root_st):
327 if not rel:
327 if not rel:
328 # name was actually the same as root (maybe a symlink)
328 # name was actually the same as root (maybe a symlink)
329 return ''
329 return ''
330 rel.reverse()
330 rel.reverse()
331 name = os.path.join(*rel)
331 name = os.path.join(*rel)
332 audit_path(name)
332 audit_path(name)
333 return pconvert(name)
333 return pconvert(name)
334 dirname, basename = os.path.split(name)
334 dirname, basename = os.path.split(name)
335 rel.append(basename)
335 rel.append(basename)
336 if dirname == name:
336 if dirname == name:
337 break
337 break
338 name = dirname
338 name = dirname
339
339
340 raise Abort('%s not under root' % myname)
340 raise Abort('%s not under root' % myname)
341
341
342 _hgexecutable = None
342 _hgexecutable = None
343
343
344 def main_is_frozen():
344 def main_is_frozen():
345 """return True if we are a frozen executable.
345 """return True if we are a frozen executable.
346
346
347 The code supports py2exe (most common, Windows only) and tools/freeze
347 The code supports py2exe (most common, Windows only) and tools/freeze
348 (portable, not much used).
348 (portable, not much used).
349 """
349 """
350 return (hasattr(sys, "frozen") or # new py2exe
350 return (hasattr(sys, "frozen") or # new py2exe
351 hasattr(sys, "importers") or # old py2exe
351 hasattr(sys, "importers") or # old py2exe
352 imp.is_frozen("__main__")) # tools/freeze
352 imp.is_frozen("__main__")) # tools/freeze
353
353
354 def hgexecutable():
354 def hgexecutable():
355 """return location of the 'hg' executable.
355 """return location of the 'hg' executable.
356
356
357 Defaults to $HG or 'hg' in the search path.
357 Defaults to $HG or 'hg' in the search path.
358 """
358 """
359 if _hgexecutable is None:
359 if _hgexecutable is None:
360 hg = os.environ.get('HG')
360 hg = os.environ.get('HG')
361 if hg:
361 if hg:
362 set_hgexecutable(hg)
362 set_hgexecutable(hg)
363 elif main_is_frozen():
363 elif main_is_frozen():
364 set_hgexecutable(sys.executable)
364 set_hgexecutable(sys.executable)
365 else:
365 else:
366 exe = find_exe('hg') or os.path.basename(sys.argv[0])
366 exe = find_exe('hg') or os.path.basename(sys.argv[0])
367 set_hgexecutable(exe)
367 set_hgexecutable(exe)
368 return _hgexecutable
368 return _hgexecutable
369
369
370 def set_hgexecutable(path):
370 def set_hgexecutable(path):
371 """set location of the 'hg' executable"""
371 """set location of the 'hg' executable"""
372 global _hgexecutable
372 global _hgexecutable
373 _hgexecutable = path
373 _hgexecutable = path
374
374
375 def system(cmd, environ={}, cwd=None, onerr=None, errprefix=None, out=None):
375 def system(cmd, environ={}, cwd=None, onerr=None, errprefix=None, out=None):
376 '''enhanced shell command execution.
376 '''enhanced shell command execution.
377 run with environment possibly modified, possibly in a different dir.
377 run with environment possibly modified, possibly in a different dir.
378
378
379 if the command fails and onerr is None, return the exit status. if
379 if the command fails and onerr is None, return the exit status. if
380 onerr is a ui object, print an error message and return the status;
380 onerr is a ui object, print an error message and return the status;
381 otherwise raise onerr as an exception.
381 otherwise raise onerr as an exception.
382
382
383 if out is specified, it is assumed to be a file-like object that has a
383 if out is specified, it is assumed to be a file-like object that has a
384 write() method. stdout and stderr will be redirected to out.'''
384 write() method. stdout and stderr will be redirected to out.'''
385 def py2shell(val):
385 def py2shell(val):
386 'convert python object into string that is useful to shell'
386 'convert python object into string that is useful to shell'
387 if val is None or val is False:
387 if val is None or val is False:
388 return '0'
388 return '0'
389 if val is True:
389 if val is True:
390 return '1'
390 return '1'
391 return str(val)
391 return str(val)
392 origcmd = cmd
392 origcmd = cmd
393 if os.name == 'nt':
393 if os.name == 'nt':
394 cmd = '"%s"' % cmd
394 cmd = '"%s"' % cmd
395 env = dict(os.environ)
395 env = dict(os.environ)
396 env.update((k, py2shell(v)) for k, v in environ.iteritems())
396 env.update((k, py2shell(v)) for k, v in environ.iteritems())
397 env['HG'] = hgexecutable()
397 env['HG'] = hgexecutable()
398 if out is None:
398 if out is None:
399 rc = subprocess.call(cmd, shell=True, close_fds=closefds,
399 rc = subprocess.call(cmd, shell=True, close_fds=closefds,
400 env=env, cwd=cwd)
400 env=env, cwd=cwd)
401 else:
401 else:
402 proc = subprocess.Popen(cmd, shell=True, close_fds=closefds,
402 proc = subprocess.Popen(cmd, shell=True, close_fds=closefds,
403 env=env, cwd=cwd, stdout=subprocess.PIPE,
403 env=env, cwd=cwd, stdout=subprocess.PIPE,
404 stderr=subprocess.STDOUT)
404 stderr=subprocess.STDOUT)
405 for line in proc.stdout:
405 for line in proc.stdout:
406 out.write(line)
406 out.write(line)
407 proc.wait()
407 proc.wait()
408 rc = proc.returncode
408 rc = proc.returncode
409 if sys.platform == 'OpenVMS' and rc & 1:
409 if sys.platform == 'OpenVMS' and rc & 1:
410 rc = 0
410 rc = 0
411 if rc and onerr:
411 if rc and onerr:
412 errmsg = '%s %s' % (os.path.basename(origcmd.split(None, 1)[0]),
412 errmsg = '%s %s' % (os.path.basename(origcmd.split(None, 1)[0]),
413 explain_exit(rc)[0])
413 explain_exit(rc)[0])
414 if errprefix:
414 if errprefix:
415 errmsg = '%s: %s' % (errprefix, errmsg)
415 errmsg = '%s: %s' % (errprefix, errmsg)
416 try:
416 try:
417 onerr.warn(errmsg + '\n')
417 onerr.warn(errmsg + '\n')
418 except AttributeError:
418 except AttributeError:
419 raise onerr(errmsg)
419 raise onerr(errmsg)
420 return rc
420 return rc
421
421
422 def checksignature(func):
422 def checksignature(func):
423 '''wrap a function with code to check for calling errors'''
423 '''wrap a function with code to check for calling errors'''
424 def check(*args, **kwargs):
424 def check(*args, **kwargs):
425 try:
425 try:
426 return func(*args, **kwargs)
426 return func(*args, **kwargs)
427 except TypeError:
427 except TypeError:
428 if len(traceback.extract_tb(sys.exc_info()[2])) == 1:
428 if len(traceback.extract_tb(sys.exc_info()[2])) == 1:
429 raise error.SignatureError
429 raise error.SignatureError
430 raise
430 raise
431
431
432 return check
432 return check
433
433
434 # os.path.lexists is not available on python2.3
434 # os.path.lexists is not available on python2.3
435 def lexists(filename):
435 def lexists(filename):
436 "test whether a file with this name exists. does not follow symlinks"
436 "test whether a file with this name exists. does not follow symlinks"
437 try:
437 try:
438 os.lstat(filename)
438 os.lstat(filename)
439 except:
439 except:
440 return False
440 return False
441 return True
441 return True
442
442
443 def unlink(f):
443 def unlink(f):
444 """unlink and remove the directory if it is empty"""
444 """unlink and remove the directory if it is empty"""
445 os.unlink(f)
445 os.unlink(f)
446 # try removing directories that might now be empty
446 # try removing directories that might now be empty
447 try:
447 try:
448 os.removedirs(os.path.dirname(f))
448 os.removedirs(os.path.dirname(f))
449 except OSError:
449 except OSError:
450 pass
450 pass
451
451
452 def copyfile(src, dest):
452 def copyfile(src, dest):
453 "copy a file, preserving mode and atime/mtime"
453 "copy a file, preserving mode and atime/mtime"
454 if os.path.islink(src):
454 if os.path.islink(src):
455 try:
455 try:
456 os.unlink(dest)
456 os.unlink(dest)
457 except:
457 except:
458 pass
458 pass
459 os.symlink(os.readlink(src), dest)
459 os.symlink(os.readlink(src), dest)
460 else:
460 else:
461 try:
461 try:
462 shutil.copyfile(src, dest)
462 shutil.copyfile(src, dest)
463 shutil.copystat(src, dest)
463 shutil.copystat(src, dest)
464 except shutil.Error, inst:
464 except shutil.Error, inst:
465 raise Abort(str(inst))
465 raise Abort(str(inst))
466
466
467 def copyfiles(src, dst, hardlink=None):
467 def copyfiles(src, dst, hardlink=None):
468 """Copy a directory tree using hardlinks if possible"""
468 """Copy a directory tree using hardlinks if possible"""
469
469
470 if hardlink is None:
470 if hardlink is None:
471 hardlink = (os.stat(src).st_dev ==
471 hardlink = (os.stat(src).st_dev ==
472 os.stat(os.path.dirname(dst)).st_dev)
472 os.stat(os.path.dirname(dst)).st_dev)
473
473
474 num = 0
474 num = 0
475 if os.path.isdir(src):
475 if os.path.isdir(src):
476 os.mkdir(dst)
476 os.mkdir(dst)
477 for name, kind in osutil.listdir(src):
477 for name, kind in osutil.listdir(src):
478 srcname = os.path.join(src, name)
478 srcname = os.path.join(src, name)
479 dstname = os.path.join(dst, name)
479 dstname = os.path.join(dst, name)
480 hardlink, n = copyfiles(srcname, dstname, hardlink)
480 hardlink, n = copyfiles(srcname, dstname, hardlink)
481 num += n
481 num += n
482 else:
482 else:
483 if hardlink:
483 if hardlink:
484 try:
484 try:
485 os_link(src, dst)
485 os_link(src, dst)
486 except (IOError, OSError):
486 except (IOError, OSError):
487 hardlink = False
487 hardlink = False
488 shutil.copy(src, dst)
488 shutil.copy(src, dst)
489 else:
489 else:
490 shutil.copy(src, dst)
490 shutil.copy(src, dst)
491 num += 1
491 num += 1
492
492
493 return hardlink, num
493 return hardlink, num
494
494
495 class path_auditor(object):
495 class path_auditor(object):
496 '''ensure that a filesystem path contains no banned components.
496 '''ensure that a filesystem path contains no banned components.
497 the following properties of a path are checked:
497 the following properties of a path are checked:
498
498
499 - under top-level .hg
499 - under top-level .hg
500 - starts at the root of a windows drive
500 - starts at the root of a windows drive
501 - contains ".."
501 - contains ".."
502 - traverses a symlink (e.g. a/symlink_here/b)
502 - traverses a symlink (e.g. a/symlink_here/b)
503 - inside a nested repository'''
503 - inside a nested repository'''
504
504
505 def __init__(self, root):
505 def __init__(self, root):
506 self.audited = set()
506 self.audited = set()
507 self.auditeddir = set()
507 self.auditeddir = set()
508 self.root = root
508 self.root = root
509
509
510 def __call__(self, path):
510 def __call__(self, path):
511 if path in self.audited:
511 if path in self.audited:
512 return
512 return
513 normpath = os.path.normcase(path)
513 normpath = os.path.normcase(path)
514 parts = splitpath(normpath)
514 parts = splitpath(normpath)
515 if (os.path.splitdrive(path)[0]
515 if (os.path.splitdrive(path)[0]
516 or parts[0].lower() in ('.hg', '.hg.', '')
516 or parts[0].lower() in ('.hg', '.hg.', '')
517 or os.pardir in parts):
517 or os.pardir in parts):
518 raise Abort(_("path contains illegal component: %s") % path)
518 raise Abort(_("path contains illegal component: %s") % path)
519 if '.hg' in path.lower():
519 if '.hg' in path.lower():
520 lparts = [p.lower() for p in parts]
520 lparts = [p.lower() for p in parts]
521 for p in '.hg', '.hg.':
521 for p in '.hg', '.hg.':
522 if p in lparts[1:]:
522 if p in lparts[1:]:
523 pos = lparts.index(p)
523 pos = lparts.index(p)
524 base = os.path.join(*parts[:pos])
524 base = os.path.join(*parts[:pos])
525 raise Abort(_('path %r is inside repo %r') % (path, base))
525 raise Abort(_('path %r is inside repo %r') % (path, base))
526 def check(prefix):
526 def check(prefix):
527 curpath = os.path.join(self.root, prefix)
527 curpath = os.path.join(self.root, prefix)
528 try:
528 try:
529 st = os.lstat(curpath)
529 st = os.lstat(curpath)
530 except OSError, err:
530 except OSError, err:
531 # EINVAL can be raised for invalid path syntax under win32.
531 # EINVAL can be raised for invalid path syntax under win32.
532 # It must be ignored so that patterns can still be checked.
532 # It must be ignored so that patterns can still be checked.
533 if err.errno not in (errno.ENOENT, errno.ENOTDIR, errno.EINVAL):
533 if err.errno not in (errno.ENOENT, errno.ENOTDIR, errno.EINVAL):
534 raise
534 raise
535 else:
535 else:
536 if stat.S_ISLNK(st.st_mode):
536 if stat.S_ISLNK(st.st_mode):
537 raise Abort(_('path %r traverses symbolic link %r') %
537 raise Abort(_('path %r traverses symbolic link %r') %
538 (path, prefix))
538 (path, prefix))
539 elif (stat.S_ISDIR(st.st_mode) and
539 elif (stat.S_ISDIR(st.st_mode) and
540 os.path.isdir(os.path.join(curpath, '.hg'))):
540 os.path.isdir(os.path.join(curpath, '.hg'))):
541 raise Abort(_('path %r is inside repo %r') %
541 raise Abort(_('path %r is inside repo %r') %
542 (path, prefix))
542 (path, prefix))
543 parts.pop()
543 parts.pop()
544 prefixes = []
544 prefixes = []
545 while parts:
545 while parts:
546 prefix = os.sep.join(parts)
546 prefix = os.sep.join(parts)
547 if prefix in self.auditeddir:
547 if prefix in self.auditeddir:
548 break
548 break
549 check(prefix)
549 check(prefix)
550 prefixes.append(prefix)
550 prefixes.append(prefix)
551 parts.pop()
551 parts.pop()
552
552
553 self.audited.add(path)
553 self.audited.add(path)
554 # only add prefixes to the cache after checking everything: we don't
554 # only add prefixes to the cache after checking everything: we don't
555 # want to add "foo/bar/baz" before checking if there's a "foo/.hg"
555 # want to add "foo/bar/baz" before checking if there's a "foo/.hg"
556 self.auditeddir.update(prefixes)
556 self.auditeddir.update(prefixes)
557
557
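# A minimal usage sketch (illustrative, not part of the original source;
# the repository path is hypothetical). A path_auditor is bound to a
# repository root, raises Abort for paths that escape it or look
# suspicious, and caches accepted paths so repeated checks are cheap:
#
#     audit = path_auditor('/path/to/repo')
#     audit('data/foo.txt')     # ok, cached in self.audited
#     audit('../etc/passwd')    # raises Abort: contains os.pardir
#     audit('.hg/hgrc')         # raises Abort: under top-level .hg
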
def nlinks(pathname):
    """Return number of hardlinks for the given file."""
    return os.lstat(pathname).st_nlink

if hasattr(os, 'link'):
    os_link = os.link
else:
    def os_link(src, dst):
        raise OSError(0, _("Hardlinks not supported"))

def lookup_reg(key, name=None, scope=None):
    return None

def hidewindow():
    """Hide current shell window.

    Used to hide the window opened when starting an asynchronous
    child process under Windows; unneeded on other systems.
    """
    pass

if os.name == 'nt':
    from windows import *
else:
    from posix import *

def makelock(info, pathname):
    try:
        return os.symlink(info, pathname)
    except OSError, why:
        if why.errno == errno.EEXIST:
            raise
    except AttributeError: # no symlink in os
        pass

    ld = os.open(pathname, os.O_CREAT | os.O_WRONLY | os.O_EXCL)
    os.write(ld, info)
    os.close(ld)

def readlock(pathname):
    try:
        return os.readlink(pathname)
    except OSError, why:
        if why.errno not in (errno.EINVAL, errno.ENOSYS):
            raise
    except AttributeError: # no symlink in os
        pass
    return posixfile(pathname).read()

def fstat(fp):
    '''stat file object that may not have fileno method.'''
    try:
        return os.fstat(fp.fileno())
    except AttributeError:
        return os.stat(fp.name)

# File system features

def checkcase(path):
    """
    Check whether the given path is on a case-sensitive filesystem

    Requires a path (like /foo/.hg) ending with a foldable final
    directory component.
    """
    s1 = os.stat(path)
    d, b = os.path.split(path)
    p2 = os.path.join(d, b.upper())
    if path == p2:
        p2 = os.path.join(d, b.lower())
    try:
        s2 = os.stat(p2)
        if s2 == s1:
            return False
        return True
    except:
        return True

_fspathcache = {}
def fspath(name, root):
    '''Get name in the case stored in the filesystem

    The name is either relative to root, or it is an absolute path starting
    with root. Note that this function is unnecessary, and should not be
    called, for case-sensitive filesystems (simply because it's expensive).
    '''
    # If name is absolute, make it relative
    if name.lower().startswith(root.lower()):
        l = len(root)
        if name[l] == os.sep or name[l] == os.altsep:
            l = l + 1
        name = name[l:]

    if not os.path.exists(os.path.join(root, name)):
        return None

    seps = os.sep
    if os.altsep:
        seps = seps + os.altsep
    # Protect backslashes. This gets silly very quickly.
    seps = seps.replace('\\', '\\\\')
    pattern = re.compile(r'([^%s]+)|([%s]+)' % (seps, seps))
    dir = os.path.normcase(os.path.normpath(root))
    result = []
    for part, sep in pattern.findall(name):
        if sep:
            result.append(sep)
            continue

        if dir not in _fspathcache:
            _fspathcache[dir] = os.listdir(dir)
        contents = _fspathcache[dir]

        lpart = part.lower()
        lenp = len(part)
        for n in contents:
            if lenp == len(n) and n.lower() == lpart:
                result.append(n)
                break
        else:
            # Cannot happen, as the file exists!
            result.append(part)
        dir = os.path.join(dir, lpart)

    return ''.join(result)

def checkexec(path):
    """
    Check whether the given path is on a filesystem with UNIX-like exec flags

    Requires a directory (like /foo/.hg)
    """

    # VFAT on some Linux versions can flip mode but it doesn't persist
    # across a FS remount. Frequently we can detect it if files are created
    # with exec bit on.

    try:
        EXECFLAGS = stat.S_IXUSR | stat.S_IXGRP | stat.S_IXOTH
        fh, fn = tempfile.mkstemp(dir=path, prefix='hg-checkexec-')
        try:
            os.close(fh)
            m = os.stat(fn).st_mode & 0777
            new_file_has_exec = m & EXECFLAGS
            os.chmod(fn, m ^ EXECFLAGS)
            exec_flags_cannot_flip = ((os.stat(fn).st_mode & 0777) == m)
        finally:
            os.unlink(fn)
    except (IOError, OSError):
        # we don't care, the user probably won't be able to commit anyway
        return False
    return not (new_file_has_exec or exec_flags_cannot_flip)

def checklink(path):
    """check whether the given path is on a symlink-capable filesystem"""
    # mktemp is not racy because symlink creation will fail if the
    # file already exists
    name = tempfile.mktemp(dir=path, prefix='hg-checklink-')
    try:
        os.symlink(".", name)
        os.unlink(name)
        return True
    except (OSError, AttributeError):
        return False

def needbinarypatch():
    """return True if patches should be applied in binary mode by default."""
    return os.name == 'nt'

def endswithsep(path):
    '''Check if the path ends with os.sep or os.altsep.'''
    return path.endswith(os.sep) or os.altsep and path.endswith(os.altsep)

def splitpath(path):
    '''Split path by os.sep.
    Note that this function does not use os.altsep because it is
    meant as a simple alternative to "path.split(os.sep)".
    It is recommended to apply os.path.normpath() before calling this
    function if needed.'''
    return path.split(os.sep)

def gui():
    '''Are we running in a GUI?'''
    return os.name == "nt" or os.name == "mac" or os.environ.get("DISPLAY")

def mktempcopy(name, emptyok=False, createmode=None):
    """Create a temporary file with the same contents as the named file

    The permission bits are copied from the original file.

    If the temporary file is going to be truncated immediately, you
    can use emptyok=True as an optimization.

    Returns the name of the temporary file.
    """
    d, fn = os.path.split(name)
    fd, temp = tempfile.mkstemp(prefix='.%s-' % fn, dir=d)
    os.close(fd)
    # Temporary files are created with mode 0600, which is usually not
    # what we want. If the original file already exists, just copy
    # its mode. Otherwise, manually obey umask.
    try:
        st_mode = os.lstat(name).st_mode & 0777
    except OSError, inst:
        if inst.errno != errno.ENOENT:
            raise
        st_mode = createmode
        if st_mode is None:
            st_mode = ~umask
        st_mode &= 0666
    os.chmod(temp, st_mode)
    if emptyok:
        return temp
    try:
        try:
            ifp = posixfile(name, "rb")
        except IOError, inst:
            if inst.errno == errno.ENOENT:
                return temp
            if not getattr(inst, 'filename', None):
                inst.filename = name
            raise
        ofp = posixfile(temp, "wb")
        for chunk in filechunkiter(ifp):
            ofp.write(chunk)
        ifp.close()
        ofp.close()
    except:
        try: os.unlink(temp)
        except: pass
        raise
    return temp

class atomictempfile(object):
    """file-like object that atomically updates a file

    All writes will be redirected to a temporary copy of the original
    file. When rename is called, the copy is renamed to the original
    name, making the changes visible.
    """
    def __init__(self, name, mode='w+b', createmode=None):
        self.__name = name
        self._fp = None
        self.temp = mktempcopy(name, emptyok=('w' in mode),
                               createmode=createmode)
        self._fp = posixfile(self.temp, mode)

    def __getattr__(self, name):
        return getattr(self._fp, name)

    def rename(self):
        if not self._fp.closed:
            self._fp.close()
            rename(self.temp, localpath(self.__name))

    def __del__(self):
        if not self._fp:
            return
        if not self._fp.closed:
            try:
                os.unlink(self.temp)
            except: pass
            self._fp.close()

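# A minimal usage sketch (illustrative, not part of the original source;
# the file name is hypothetical). Writes land in a temporary copy and only
# become visible when rename() is called; if the object is dropped first,
# the temp file is removed and the original is left untouched:
#
#     f = atomictempfile('/path/to/file', 'w')
#     f.write('new content')
#     f.rename()   # atomically replaces /path/to/file
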
def makedirs(name, mode=None):
    """recursive directory creation with parent mode inheritance"""
    try:
        os.mkdir(name)
        if mode is not None:
            os.chmod(name, mode)
        return
    except OSError, err:
        if err.errno == errno.EEXIST:
            return
        if err.errno != errno.ENOENT:
            raise
    parent = os.path.abspath(os.path.dirname(name))
    makedirs(parent, mode)
    makedirs(name, mode)

class opener(object):
    """Open files relative to a base directory

    This class is used to hide the details of COW semantics and
    remote file access from higher level code.
    """
    def __init__(self, base, audit=True):
        self.base = base
        if audit:
            self.audit_path = path_auditor(base)
        else:
            self.audit_path = always
        self.createmode = None

    @propertycache
    def _can_symlink(self):
        return checklink(self.base)

    def _fixfilemode(self, name):
        if self.createmode is None:
            return
        os.chmod(name, self.createmode & 0666)

    def __call__(self, path, mode="r", text=False, atomictemp=False):
        self.audit_path(path)
        f = os.path.join(self.base, path)

        if not text and "b" not in mode:
            mode += "b" # for that other OS

        nlink = -1
        if mode not in ("r", "rb"):
            try:
                nlink = nlinks(f)
            except OSError:
                nlink = 0
                d = os.path.dirname(f)
                if not os.path.isdir(d):
                    makedirs(d, self.createmode)
            if atomictemp:
                return atomictempfile(f, mode, self.createmode)
            if nlink > 1:
                rename(mktempcopy(f), f)
        fp = posixfile(f, mode)
        if nlink == 0:
            self._fixfilemode(f)
        return fp

    def symlink(self, src, dst):
        self.audit_path(dst)
        linkname = os.path.join(self.base, dst)
        try:
            os.unlink(linkname)
        except OSError:
            pass

        dirname = os.path.dirname(linkname)
        if not os.path.exists(dirname):
            makedirs(dirname, self.createmode)

        if self._can_symlink:
            try:
                os.symlink(src, linkname)
            except OSError, err:
                raise OSError(err.errno, _('could not symlink to %r: %s') %
                              (src, err.strerror), linkname)
        else:
            f = self(dst, "w")
            f.write(src)
            f.close()
            self._fixfilemode(dst)

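# A minimal usage sketch (illustrative, not part of the original source;
# paths are hypothetical). An opener audits relative paths, creates
# missing parent directories on write, and breaks hardlinks before
# modifying a file:
#
#     op = opener('/path/to/repo/.hg')
#     fp = op('store/undo.notes', 'w')   # path audited, parents created
#     fp.write('some data')
#     fp.close()
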
class chunkbuffer(object):
    """Allow arbitrary sized chunks of data to be efficiently read from an
    iterator over chunks of arbitrary size."""

    def __init__(self, in_iter):
        """in_iter is the iterator that's iterating over the input chunks."""
        def splitbig(chunks):
            # split chunks bigger than 1MB into 256kB pieces before
            # buffering, so read() never joins very large strings
            for chunk in chunks:
                if len(chunk) > 2**20:
                    pos = 0
                    while pos < len(chunk):
                        end = pos + 2 ** 18
                        yield chunk[pos:end]
                        pos = end
                else:
                    yield chunk
        self.iter = splitbig(in_iter)
        self.buf = ''

    def read(self, l):
        """Read L bytes of data from the iterator of chunks of data.
        Returns less than L bytes if the iterator runs dry."""
        if l > len(self.buf) and self.iter:
            # collect at least 2**16 bytes (64kB) per refill of the buffer
            targetsize = max(l, 2**16)
            collector = [str(self.buf)]
            collected = len(self.buf)
            for chunk in self.iter:
                collector.append(chunk)
                collected += len(chunk)
                if collected >= targetsize:
                    break
            else:
                self.iter = False
            self.buf = ''.join(collector)
        if len(self.buf) == l:
            s, self.buf = str(self.buf), ''
        else:
            s, self.buf = self.buf[:l], buffer(self.buf, l)
        return s

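# A sketch of the buffering behaviour (illustrative, not part of the
# original source): input chunk boundaries are invisible to the reader,
# and oversized input strings are pre-split by splitbig before they
# ever reach read():
#
#     buf = chunkbuffer(iter(['ab', 'cdef', 'g']))
#     buf.read(3)    # -> 'abc'
#     buf.read(10)   # -> 'defg' (iterator ran dry, short read)
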
def filechunkiter(f, size=65536, limit=None):
    """Create a generator that produces the data in the file size
    (default 65536) bytes at a time, up to optional limit (default is
    to read all data). Chunks may be less than size bytes if the
    chunk is the last chunk in the file, or the file is a socket or
    some other type of file that sometimes reads less data than is
    requested."""
    assert size >= 0
    assert limit is None or limit >= 0
    while True:
        if limit is None:
            nbytes = size
        else:
            nbytes = min(limit, size)
        s = nbytes and f.read(nbytes)
        if not s:
            break
        if limit:
            limit -= len(s)
        yield s

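# An example (illustrative, not part of the original source): a
# 150000-byte stream read with the default chunk size yields
# 65536 + 65536 + 18928 bytes:
#
#     from cStringIO import StringIO
#     [len(c) for c in filechunkiter(StringIO('x' * 150000))]
#     # -> [65536, 65536, 18928]
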
def makedate():
    lt = time.localtime()
    if lt[8] == 1 and time.daylight:
        tz = time.altzone
    else:
        tz = time.timezone
    return time.mktime(lt), tz

def datestr(date=None, format='%a %b %d %H:%M:%S %Y %1%2'):
    """represent a (unixtime, offset) tuple as a localized time.
    unixtime is seconds since the epoch, and offset is the time zone's
    number of seconds away from UTC. "%1" in the format string expands
    to the signed hours of the offset, "%2" to its minutes."""
    t, tz = date or makedate()
    if "%1" in format or "%2" in format:
        sign = (tz > 0) and "-" or "+"
        minutes = abs(tz) // 60
        format = format.replace("%1", "%c%02d" % (sign, minutes // 60))
        format = format.replace("%2", "%02d" % (minutes % 60))
    s = time.strftime(format, time.gmtime(float(t) - tz))
    return s

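# A worked example (illustrative, not part of the original source): an
# offset of -3600 means one hour east of UTC, so "%1%2" renders "+0100":
#
#     datestr((0, -3600), format='%Y-%m-%d %H:%M %1%2')
#     # -> '1970-01-01 01:00 +0100'
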
def shortdate(date=None):
    """turn (timestamp, tzoff) tuple into an ISO 8601 date string."""
    return datestr(date, format='%Y-%m-%d')

def strdate(string, format, defaults=[]):
    """parse a localized time string and return a (unixtime, offset) tuple.
    if the string cannot be parsed, ValueError is raised."""
    def timezone(string):
        tz = string.split()[-1]
        if tz[0] in "+-" and len(tz) == 5 and tz[1:].isdigit():
            sign = (tz[0] == "+") and 1 or -1
            hours = int(tz[1:3])
            minutes = int(tz[3:5])
            return -sign * (hours * 60 + minutes) * 60
        if tz == "GMT" or tz == "UTC":
            return 0
        return None

    # NOTE: unixtime = localunixtime + offset
    offset, date = timezone(string), string
    if offset is not None:
        date = " ".join(string.split()[:-1])

    # add missing elements from defaults
    for part in defaults:
        found = [True for p in part if ("%"+p) in format]
        if not found:
            date += "@" + defaults[part]
            format += "@%" + part[0]

    timetuple = time.strptime(date, format)
    localunixtime = int(calendar.timegm(timetuple))
    if offset is None:
        # local timezone
        unixtime = int(time.mktime(timetuple))
        offset = unixtime - localunixtime
    else:
        unixtime = localunixtime + offset
    return unixtime, offset

def parsedate(date, formats=None, defaults=None):
    """parse a localized date/time string and return a (unixtime, offset) tuple.

    The date may be a "unixtime offset" string or in one of the specified
    formats. If the date already is a (unixtime, offset) tuple, it is returned.
    """
    if not date:
        return 0, 0
    if isinstance(date, tuple) and len(date) == 2:
        return date
    if not formats:
        formats = defaultdateformats
    date = date.strip()
    try:
        when, offset = map(int, date.split(' '))
    except ValueError:
        # fill out defaults
        if not defaults:
            defaults = {}
        now = makedate()
        for part in "d mb yY HI M S".split():
            if part not in defaults:
                if part[0] in "HMS":
                    defaults[part] = "00"
                else:
                    defaults[part] = datestr(now, "%" + part[0])

        for format in formats:
            try:
                when, offset = strdate(date, format, defaults)
            except (ValueError, OverflowError):
                pass
            else:
                break
        else:
            raise Abort(_('invalid date: %r') % date)
    # validate explicit (probably user-specified) date and
    # time zone offset. values must fit in signed 32 bits for
    # current 32-bit linux runtimes. timezones go from UTC-12
    # to UTC+14
    if abs(when) > 0x7fffffff:
        raise Abort(_('date exceeds 32 bits: %d') % when)
    if offset < -50400 or offset > 43200:
        raise Abort(_('impossible time zone offset: %d') % offset)
    return when, offset

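# Examples (illustrative, not part of the original source): the fast path
# accepts a raw "unixtime offset" pair, while formatted strings go
# through strdate() and round-trip with datestr():
#
#     parsedate('0 0')                      # -> (0, 0)
#     parsedate('1970-01-01 01:00 +0100')   # -> (0, -3600)
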
def matchdate(date):
    """Return a function that matches a given date match specifier

    Formats include:

    '{date}' match a given date to the accuracy provided

    '<{date}' on or before a given date

    '>{date}' on or after a given date

    '-{days}' within a given number of days of today

    '{date} to {date}' a date range, inclusive
    """

    def lower(date):
        d = dict(mb="1", d="1")
        return parsedate(date, extendeddateformats, d)[0]

    def upper(date):
        d = dict(mb="12", HI="23", M="59", S="59")
        for days in "31 30 29".split():
            try:
                d["d"] = days
                return parsedate(date, extendeddateformats, d)[0]
            except:
                pass
        d["d"] = "28"
        return parsedate(date, extendeddateformats, d)[0]

    date = date.strip()
    if date[0] == "<":
        when = upper(date[1:])
        return lambda x: x <= when
    elif date[0] == ">":
        when = lower(date[1:])
        return lambda x: x >= when
    elif date[0] == "-":
        try:
            days = int(date[1:])
        except ValueError:
            raise Abort(_("invalid day spec: %s") % date[1:])
        when = makedate()[0] - days * 3600 * 24
        return lambda x: x >= when
    elif " to " in date:
        a, b = date.split(" to ")
        start, stop = lower(a), upper(b)
        return lambda x: x >= start and x <= stop
    else:
        start, stop = lower(date), upper(date)
        return lambda x: x >= start and x <= stop

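# An example (illustrative, not part of the original source): the
# returned predicate takes a unixtime, so parsedate() output fits it:
#
#     m = matchdate('>2010-05-01')
#     m(parsedate('2010-06-01')[0])   # -> True
#     m(parsedate('2010-04-01')[0])   # -> False
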
def shortuser(user):
    """Return a short representation of a user name or email address."""
    f = user.find('@')
    if f >= 0:
        user = user[:f]
    f = user.find('<')
    if f >= 0:
        user = user[f + 1:]
    f = user.find(' ')
    if f >= 0:
        user = user[:f]
    f = user.find('.')
    if f >= 0:
        user = user[:f]
    return user

def email(author):
    '''get email of author.'''
    r = author.find('>')
    if r == -1:
        r = None
    return author[author.find('<') + 1:r]

def ellipsis(text, maxlength=400):
    """Trim string to at most maxlength (default: 400) characters."""
    if len(text) <= maxlength:
        return text
    else:
        return "%s..." % (text[:maxlength - 3])

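# Examples (illustrative, not part of the original source):
#
#     shortuser('Foo Bar <foo.bar@example.com>')   # -> 'foo'
#     email('Foo Bar <foo.bar@example.com>')       # -> 'foo.bar@example.com'
#     ellipsis('mercurial', maxlength=6)           # -> 'mer...'
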
def walkrepos(path, followsym=False, seen_dirs=None, recurse=False):
    '''yield every hg repository under path, recursively.'''
    def errhandler(err):
        if err.filename == path:
            raise err
    if followsym and hasattr(os.path, 'samestat'):
        def _add_dir_if_not_there(dirlst, dirname):
            match = False
            samestat = os.path.samestat
            dirstat = os.stat(dirname)
            for lstdirstat in dirlst:
                if samestat(dirstat, lstdirstat):
                    match = True
                    break
            if not match:
                dirlst.append(dirstat)
            return not match
    else:
        followsym = False

    if (seen_dirs is None) and followsym:
        seen_dirs = []
        _add_dir_if_not_there(seen_dirs, path)
    for root, dirs, files in os.walk(path, topdown=True, onerror=errhandler):
        dirs.sort()
        if '.hg' in dirs:
            yield root # found a repository
            qroot = os.path.join(root, '.hg', 'patches')
            if os.path.isdir(os.path.join(qroot, '.hg')):
                yield qroot # we have a patch queue repo here
            if recurse:
                # avoid recursing inside the .hg directory
                dirs.remove('.hg')
            else:
                dirs[:] = [] # don't descend further
        elif followsym:
            newdirs = []
            for d in dirs:
                fname = os.path.join(root, d)
                if _add_dir_if_not_there(seen_dirs, fname):
                    if os.path.islink(fname):
                        for hgname in walkrepos(fname, True, seen_dirs):
                            yield hgname
                    else:
                        newdirs.append(d)
            dirs[:] = newdirs

_rcpath = None

def os_rcpath():
    '''return default os-specific hgrc search path'''
    path = system_rcpath()
    path.extend(user_rcpath())
    path = [os.path.normpath(f) for f in path]
    return path

def rcpath():
    '''return hgrc search path. if env var HGRCPATH is set, use it.
    for each item in path, if directory, use files ending in .rc,
    else use item.
    make HGRCPATH empty to only look in .hg/hgrc of current repo.
    if no HGRCPATH, use default os-specific path.'''
    global _rcpath
    if _rcpath is None:
        if 'HGRCPATH' in os.environ:
            _rcpath = []
            for p in os.environ['HGRCPATH'].split(os.pathsep):
                if not p:
                    continue
                p = expandpath(p)
                if os.path.isdir(p):
                    for f, kind in osutil.listdir(p):
                        if f.endswith('.rc'):
                            _rcpath.append(os.path.join(p, f))
                else:
                    _rcpath.append(p)
        else:
            _rcpath = os_rcpath()
    return _rcpath

def bytecount(nbytes):
    '''return byte count formatted as readable string, with units'''

    units = (
        (100, 1 << 30, _('%.0f GB')),
        (10, 1 << 30, _('%.1f GB')),
        (1, 1 << 30, _('%.2f GB')),
        (100, 1 << 20, _('%.0f MB')),
        (10, 1 << 20, _('%.1f MB')),
        (1, 1 << 20, _('%.2f MB')),
        (100, 1 << 10, _('%.0f KB')),
        (10, 1 << 10, _('%.1f KB')),
        (1, 1 << 10, _('%.2f KB')),
        (1, 1, _('%.0f bytes')),
        )

    for multiplier, divisor, format in units:
        if nbytes >= divisor * multiplier:
            return format % (nbytes / float(divisor))
    return units[-1][2] % nbytes

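# Examples (illustrative, not part of the original source): the first
# row whose threshold (multiplier * divisor) fits the value picks the
# format, so precision shrinks as magnitude grows:
#
#     bytecount(123)         # -> '123 bytes'
#     bytecount(1536)        # -> '1.50 KB'
#     bytecount(100 << 20)   # -> '100 MB'
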
def drop_scheme(scheme, path):
    sc = scheme + ':'
    if path.startswith(sc):
        path = path[len(sc):]
        if path.startswith('//'):
            if scheme == 'file':
                i = path.find('/', 2)
                if i == -1:
                    return ''
                # On Windows, absolute paths are rooted at the current drive
                # root. On POSIX they are rooted at the file system root.
                if os.name == 'nt':
                    droot = os.path.splitdrive(os.getcwd())[0] + '/'
                    path = os.path.join(droot, path[i + 1:])
                else:
                    path = path[i:]
            else:
                path = path[2:]
    return path

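# Examples (illustrative, not part of the original source):
#
#     drop_scheme('http', 'http://host/path')   # -> 'host/path'
#     drop_scheme('file', 'file:///tmp/repo')   # -> '/tmp/repo' (on POSIX)
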
def uirepr(s):
    # Avoid double backslash in Windows path repr()
    return repr(s).replace('\\\\', '\\')

#### naming convention of below implementation follows 'textwrap' module

class MBTextWrapper(textwrap.TextWrapper):
    def __init__(self, **kwargs):
        textwrap.TextWrapper.__init__(self, **kwargs)

    def _cutdown(self, str, space_left):
        l = 0
        ucstr = unicode(str, encoding.encoding)
        w = unicodedata.east_asian_width
        for i in xrange(len(ucstr)):
            l += w(ucstr[i]) in 'WFA' and 2 or 1
            if space_left < l:
                return (ucstr[:i].encode(encoding.encoding),
                        ucstr[i:].encode(encoding.encoding))
        return str, ''

    # ----------------------------------------
    # overriding of base class

    def _handle_long_word(self, reversed_chunks, cur_line, cur_len, width):
        space_left = max(width - cur_len, 1)

        if self.break_long_words:
            cut, res = self._cutdown(reversed_chunks[-1], space_left)
            cur_line.append(cut)
            reversed_chunks[-1] = res
        elif not cur_line:
            cur_line.append(reversed_chunks.pop())

#### naming convention of above implementation follows 'textwrap' module

def wrap(line, width=None, initindent='', hangindent=''):
    if width is None:
        width = termwidth() - 2
    maxindent = max(len(hangindent), len(initindent))
    if width <= maxindent:
        # adjust for weird terminal size
        width = max(78, maxindent + 1)
    wrapper = MBTextWrapper(width=width,
                            initial_indent=initindent,
                            subsequent_indent=hangindent)
    return wrapper.fill(line)

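# An example (illustrative, not part of the original source): hangindent
# applies to every line after the first, and MBTextWrapper counts
# east-asian wide characters as two columns when cutting long words:
#
#     wrap('a b c d', width=5, hangindent='  ')
#     # -> 'a b c\n  d'
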
def iterlines(iterator):
    for chunk in iterator:
        for line in chunk.splitlines():
            yield line

def expandpath(path):
    return os.path.expanduser(os.path.expandvars(path))

def hgcmd():
    """Return the command used to execute the current hg

    This is different from hgexecutable() because on Windows we want
    to avoid things that open new shell windows, like batch files, so
    we get either the python call or the current executable.
    """
    if main_is_frozen():
        return [sys.executable]
    return gethgcmd()

def rundetached(args, condfn):
    """Execute the argument list in a detached process.

    condfn is a callable which is called repeatedly and should return
    True once the child process is known to have started successfully.
    At this point, the child process PID is returned. If the child
    process fails to start or finishes before condfn() evaluates to
    True, return -1.
    """
    # Windows case is easier because the child process is either
    # successfully starting and validating the condition or exiting
    # on failure. We just poll on its PID. On Unix, if the child
    # process fails to start, it will be left in a zombie state until
    # the parent waits on it, which we cannot do since we expect a long
    # running process on success. Instead we listen for SIGCHLD telling
    # us our child process terminated.
    terminated = set()
    def handler(signum, frame):
        terminated.add(os.wait())
    prevhandler = None
    if hasattr(signal, 'SIGCHLD'):
        prevhandler = signal.signal(signal.SIGCHLD, handler)
    try:
        pid = spawndetached(args)
        while not condfn():
            if ((pid in terminated or not testpid(pid))
                and not condfn()):
                return -1
            time.sleep(0.1)
        return pid
    finally:
        if prevhandler is not None:
            signal.signal(signal.SIGCHLD, prevhandler)

# any() and all() are builtins in Python >= 2.5; provide fallbacks for
# older interpreters
try:
    any, all = any, all
except NameError:
    def any(iterable):
        for i in iterable:
            if i:
                return True
        return False

    def all(iterable):
        for i in iterable:
            if not i:
                return False
        return True

def termwidth():
    if 'COLUMNS' in os.environ:
        try:
            return int(os.environ['COLUMNS'])
        except ValueError:
            pass
    return termwidth_()