##// END OF EJS Templates
match: improve documentation - docstrings and more descriptive variable naming...
Mads Kiilerich -
r21111:9d28fd79 default
parent child Browse files
Show More
@@ -1,367 +1,397 b''
1 # match.py - filename matching
1 # match.py - filename matching
2 #
2 #
3 # Copyright 2008, 2009 Matt Mackall <mpm@selenic.com> and others
3 # Copyright 2008, 2009 Matt Mackall <mpm@selenic.com> and others
4 #
4 #
5 # This software may be used and distributed according to the terms of the
5 # This software may be used and distributed according to the terms of the
6 # GNU General Public License version 2 or any later version.
6 # GNU General Public License version 2 or any later version.
7
7
8 import re
8 import re
9 import util, pathutil
9 import util, pathutil
10 from i18n import _
10 from i18n import _
11
11
12 def _rematcher(pat):
12 def _rematcher(regex):
13 m = util.compilere(pat)
13 '''compile the regexp with the best available regexp engine and return a
14 matcher function'''
15 m = util.compilere(regex)
14 try:
16 try:
15 # slightly faster, provided by facebook's re2 bindings
17 # slightly faster, provided by facebook's re2 bindings
16 return m.test_match
18 return m.test_match
17 except AttributeError:
19 except AttributeError:
18 return m.match
20 return m.match
19
21
20 def _expandsets(pats, ctx):
22 def _expandsets(kindpats, ctx):
21 '''convert set: patterns into a list of files in the given context'''
23 '''Returns the kindpats list with the 'set' patterns expanded.'''
22 fset = set()
24 fset = set()
23 other = []
25 other = []
24
26
25 for kind, expr in pats:
27 for kind, pat in kindpats:
26 if kind == 'set':
28 if kind == 'set':
27 if not ctx:
29 if not ctx:
28 raise util.Abort("fileset expression with no context")
30 raise util.Abort("fileset expression with no context")
29 s = ctx.getfileset(expr)
31 s = ctx.getfileset(pat)
30 fset.update(s)
32 fset.update(s)
31 continue
33 continue
32 other.append((kind, expr))
34 other.append((kind, pat))
33 return fset, other
35 return fset, other
34
36
35 class match(object):
37 class match(object):
36 def __init__(self, root, cwd, patterns, include=[], exclude=[],
38 def __init__(self, root, cwd, patterns, include=[], exclude=[],
37 default='glob', exact=False, auditor=None, ctx=None):
39 default='glob', exact=False, auditor=None, ctx=None):
38 """build an object to match a set of file patterns
40 """build an object to match a set of file patterns
39
41
40 arguments:
42 arguments:
41 root - the canonical root of the tree you're matching against
43 root - the canonical root of the tree you're matching against
42 cwd - the current working directory, if relevant
44 cwd - the current working directory, if relevant
43 patterns - patterns to find
45 patterns - patterns to find
44 include - patterns to include
46 include - patterns to include (unless they are excluded)
45 exclude - patterns to exclude
47 exclude - patterns to exclude (even if they are included)
46 default - if a pattern in names has no explicit type, assume this one
48 default - if a pattern in patterns has no explicit type, assume this one
47 exact - patterns are actually literals
49 exact - patterns are actually filenames (include/exclude still apply)
48
50
49 a pattern is one of:
51 a pattern is one of:
50 'glob:<glob>' - a glob relative to cwd
52 'glob:<glob>' - a glob relative to cwd
51 're:<regexp>' - a regular expression
53 're:<regexp>' - a regular expression
52 'path:<path>' - a path relative to repository root
54 'path:<path>' - a path relative to repository root
53 'relglob:<glob>' - an unrooted glob (*.c matches C files in all dirs)
55 'relglob:<glob>' - an unrooted glob (*.c matches C files in all dirs)
54 'relpath:<path>' - a path relative to cwd
56 'relpath:<path>' - a path relative to cwd
55 'relre:<regexp>' - a regexp that needn't match the start of a name
57 'relre:<regexp>' - a regexp that needn't match the start of a name
56 'set:<fileset>' - a fileset expression
58 'set:<fileset>' - a fileset expression
57 '<something>' - a pattern of the specified default type
59 '<something>' - a pattern of the specified default type
58 """
60 """
59
61
60 self._root = root
62 self._root = root
61 self._cwd = cwd
63 self._cwd = cwd
62 self._files = [] # exact files and roots of patterns
64 self._files = [] # exact files and roots of patterns
63 self._anypats = bool(include or exclude)
65 self._anypats = bool(include or exclude)
64 self._ctx = ctx
66 self._ctx = ctx
65 self._always = False
67 self._always = False
66
68
67 if include:
69 if include:
68 pats = _normalize(include, 'glob', root, cwd, auditor)
70 kindpats = _normalize(include, 'glob', root, cwd, auditor)
69 self.includepat, im = _buildmatch(ctx, pats, '(?:/|$)')
71 self.includepat, im = _buildmatch(ctx, kindpats, '(?:/|$)')
70 if exclude:
72 if exclude:
71 pats = _normalize(exclude, 'glob', root, cwd, auditor)
73 kindpats = _normalize(exclude, 'glob', root, cwd, auditor)
72 self.excludepat, em = _buildmatch(ctx, pats, '(?:/|$)')
74 self.excludepat, em = _buildmatch(ctx, kindpats, '(?:/|$)')
73 if exact:
75 if exact:
74 if isinstance(patterns, list):
76 if isinstance(patterns, list):
75 self._files = patterns
77 self._files = patterns
76 else:
78 else:
77 self._files = list(patterns)
79 self._files = list(patterns)
78 pm = self.exact
80 pm = self.exact
79 elif patterns:
81 elif patterns:
80 pats = _normalize(patterns, default, root, cwd, auditor)
82 kindpats = _normalize(patterns, default, root, cwd, auditor)
81 self._files = _roots(pats)
83 self._files = _roots(kindpats)
82 self._anypats = self._anypats or _anypats(pats)
84 self._anypats = self._anypats or _anypats(kindpats)
83 self.patternspat, pm = _buildmatch(ctx, pats, '$')
85 self.patternspat, pm = _buildmatch(ctx, kindpats, '$')
84
86
85 if patterns or exact:
87 if patterns or exact:
86 if include:
88 if include:
87 if exclude:
89 if exclude:
88 m = lambda f: im(f) and not em(f) and pm(f)
90 m = lambda f: im(f) and not em(f) and pm(f)
89 else:
91 else:
90 m = lambda f: im(f) and pm(f)
92 m = lambda f: im(f) and pm(f)
91 else:
93 else:
92 if exclude:
94 if exclude:
93 m = lambda f: not em(f) and pm(f)
95 m = lambda f: not em(f) and pm(f)
94 else:
96 else:
95 m = pm
97 m = pm
96 else:
98 else:
97 if include:
99 if include:
98 if exclude:
100 if exclude:
99 m = lambda f: im(f) and not em(f)
101 m = lambda f: im(f) and not em(f)
100 else:
102 else:
101 m = im
103 m = im
102 else:
104 else:
103 if exclude:
105 if exclude:
104 m = lambda f: not em(f)
106 m = lambda f: not em(f)
105 else:
107 else:
106 m = lambda f: True
108 m = lambda f: True
107 self._always = True
109 self._always = True
108
110
109 self.matchfn = m
111 self.matchfn = m
110 self._fmap = set(self._files)
112 self._fmap = set(self._files)
111
113
112 def __call__(self, fn):
114 def __call__(self, fn):
113 return self.matchfn(fn)
115 return self.matchfn(fn)
114 def __iter__(self):
116 def __iter__(self):
115 for f in self._files:
117 for f in self._files:
116 yield f
118 yield f
119
120 # Callbacks related to how the matcher is used by dirstate.walk.
121 # Subscribers to these events must monkeypatch the matcher object.
117 def bad(self, f, msg):
122 def bad(self, f, msg):
118 '''callback for each explicit file that can't be
123 '''Callback from dirstate.walk for each explicit file that can't be
119 found/accessed, with an error message
124 found/accessed, with an error message.'''
120 '''
121 pass
125 pass
122 # If this is set, it will be called when an explicitly listed directory is
126
123 # visited.
127 # If an explicitdir is set, it will be called when an explicitly listed
128 # directory is visited.
124 explicitdir = None
129 explicitdir = None
125 # If this is set, it will be called when a directory discovered by recursive
130
126 # traversal is visited.
131 # If an traversedir is set, it will be called when a directory discovered
132 # by recursive traversal is visited.
127 traversedir = None
133 traversedir = None
134
128 def missing(self, f):
135 def missing(self, f):
129 pass
136 pass
130 def exact(self, f):
137
131 return f in self._fmap
132 def rel(self, f):
138 def rel(self, f):
139 '''Convert repo path back to path that is relative to cwd of matcher.'''
133 return util.pathto(self._root, self._cwd, f)
140 return util.pathto(self._root, self._cwd, f)
141
134 def files(self):
142 def files(self):
143 '''Explicitly listed files or patterns or roots:
144 if no patterns or .always(): empty list,
145 if exact: list exact files,
146 if not .anypats(): list all files and dirs,
147 else: optimal roots'''
135 return self._files
148 return self._files
149
150 def exact(self, f):
151 '''Returns True if f is in .files().'''
152 return f in self._fmap
153
136 def anypats(self):
154 def anypats(self):
155 '''Matcher uses patterns or include/exclude.'''
137 return self._anypats
156 return self._anypats
157
138 def always(self):
158 def always(self):
159 '''Matcher will match everything and .files() will be empty
160 - optimization might be possible and necessary.'''
139 return self._always
161 return self._always
140
162
141 class exact(match):
163 class exact(match):
142 def __init__(self, root, cwd, files):
164 def __init__(self, root, cwd, files):
143 match.__init__(self, root, cwd, files, exact=True)
165 match.__init__(self, root, cwd, files, exact=True)
144
166
145 class always(match):
167 class always(match):
146 def __init__(self, root, cwd):
168 def __init__(self, root, cwd):
147 match.__init__(self, root, cwd, [])
169 match.__init__(self, root, cwd, [])
148 self._always = True
170 self._always = True
149
171
150 class narrowmatcher(match):
172 class narrowmatcher(match):
151 """Adapt a matcher to work on a subdirectory only.
173 """Adapt a matcher to work on a subdirectory only.
152
174
153 The paths are remapped to remove/insert the path as needed:
175 The paths are remapped to remove/insert the path as needed:
154
176
155 >>> m1 = match('root', '', ['a.txt', 'sub/b.txt'])
177 >>> m1 = match('root', '', ['a.txt', 'sub/b.txt'])
156 >>> m2 = narrowmatcher('sub', m1)
178 >>> m2 = narrowmatcher('sub', m1)
157 >>> bool(m2('a.txt'))
179 >>> bool(m2('a.txt'))
158 False
180 False
159 >>> bool(m2('b.txt'))
181 >>> bool(m2('b.txt'))
160 True
182 True
161 >>> bool(m2.matchfn('a.txt'))
183 >>> bool(m2.matchfn('a.txt'))
162 False
184 False
163 >>> bool(m2.matchfn('b.txt'))
185 >>> bool(m2.matchfn('b.txt'))
164 True
186 True
165 >>> m2.files()
187 >>> m2.files()
166 ['b.txt']
188 ['b.txt']
167 >>> m2.exact('b.txt')
189 >>> m2.exact('b.txt')
168 True
190 True
169 >>> m2.rel('b.txt')
191 >>> m2.rel('b.txt')
170 'b.txt'
192 'b.txt'
171 >>> def bad(f, msg):
193 >>> def bad(f, msg):
172 ... print "%s: %s" % (f, msg)
194 ... print "%s: %s" % (f, msg)
173 >>> m1.bad = bad
195 >>> m1.bad = bad
174 >>> m2.bad('x.txt', 'No such file')
196 >>> m2.bad('x.txt', 'No such file')
175 sub/x.txt: No such file
197 sub/x.txt: No such file
176 """
198 """
177
199
178 def __init__(self, path, matcher):
200 def __init__(self, path, matcher):
179 self._root = matcher._root
201 self._root = matcher._root
180 self._cwd = matcher._cwd
202 self._cwd = matcher._cwd
181 self._path = path
203 self._path = path
182 self._matcher = matcher
204 self._matcher = matcher
183 self._always = matcher._always
205 self._always = matcher._always
184
206
185 self._files = [f[len(path) + 1:] for f in matcher._files
207 self._files = [f[len(path) + 1:] for f in matcher._files
186 if f.startswith(path + "/")]
208 if f.startswith(path + "/")]
187 self._anypats = matcher._anypats
209 self._anypats = matcher._anypats
188 self.matchfn = lambda fn: matcher.matchfn(self._path + "/" + fn)
210 self.matchfn = lambda fn: matcher.matchfn(self._path + "/" + fn)
189 self._fmap = set(self._files)
211 self._fmap = set(self._files)
190
212
191 def bad(self, f, msg):
213 def bad(self, f, msg):
192 self._matcher.bad(self._path + "/" + f, msg)
214 self._matcher.bad(self._path + "/" + f, msg)
193
215
194 def patkind(pat):
216 def patkind(pattern, default=None):
195 return _patsplit(pat, None)[0]
217 '''If pattern is 'kind:pat' with a known kind, return kind.'''
218 return _patsplit(pattern, default)[0]
196
219
197 def _patsplit(pat, default):
220 def _patsplit(pattern, default):
198 """Split a string into an optional pattern kind prefix and the
221 """Split a string into the optional pattern kind prefix and the actual
199 actual pattern."""
222 pattern."""
200 if ':' in pat:
223 if ':' in pattern:
201 kind, val = pat.split(':', 1)
224 kind, pat = pattern.split(':', 1)
202 if kind in ('re', 'glob', 'path', 'relglob', 'relpath', 'relre',
225 if kind in ('re', 'glob', 'path', 'relglob', 'relpath', 'relre',
203 'listfile', 'listfile0', 'set'):
226 'listfile', 'listfile0', 'set'):
204 return kind, val
227 return kind, pat
205 return default, pat
228 return default, pattern
206
229
207 def _globre(pat):
230 def _globre(pat):
208 "convert a glob pattern into a regexp"
231 '''Convert an extended glob string to a regexp string.'''
209 i, n = 0, len(pat)
232 i, n = 0, len(pat)
210 res = ''
233 res = ''
211 group = 0
234 group = 0
212 escape = re.escape
235 escape = re.escape
213 def peek():
236 def peek():
214 return i < n and pat[i]
237 return i < n and pat[i]
215 while i < n:
238 while i < n:
216 c = pat[i]
239 c = pat[i]
217 i += 1
240 i += 1
218 if c not in '*?[{},\\':
241 if c not in '*?[{},\\':
219 res += escape(c)
242 res += escape(c)
220 elif c == '*':
243 elif c == '*':
221 if peek() == '*':
244 if peek() == '*':
222 i += 1
245 i += 1
223 res += '.*'
246 res += '.*'
224 else:
247 else:
225 res += '[^/]*'
248 res += '[^/]*'
226 elif c == '?':
249 elif c == '?':
227 res += '.'
250 res += '.'
228 elif c == '[':
251 elif c == '[':
229 j = i
252 j = i
230 if j < n and pat[j] in '!]':
253 if j < n and pat[j] in '!]':
231 j += 1
254 j += 1
232 while j < n and pat[j] != ']':
255 while j < n and pat[j] != ']':
233 j += 1
256 j += 1
234 if j >= n:
257 if j >= n:
235 res += '\\['
258 res += '\\['
236 else:
259 else:
237 stuff = pat[i:j].replace('\\','\\\\')
260 stuff = pat[i:j].replace('\\','\\\\')
238 i = j + 1
261 i = j + 1
239 if stuff[0] == '!':
262 if stuff[0] == '!':
240 stuff = '^' + stuff[1:]
263 stuff = '^' + stuff[1:]
241 elif stuff[0] == '^':
264 elif stuff[0] == '^':
242 stuff = '\\' + stuff
265 stuff = '\\' + stuff
243 res = '%s[%s]' % (res, stuff)
266 res = '%s[%s]' % (res, stuff)
244 elif c == '{':
267 elif c == '{':
245 group += 1
268 group += 1
246 res += '(?:'
269 res += '(?:'
247 elif c == '}' and group:
270 elif c == '}' and group:
248 res += ')'
271 res += ')'
249 group -= 1
272 group -= 1
250 elif c == ',' and group:
273 elif c == ',' and group:
251 res += '|'
274 res += '|'
252 elif c == '\\':
275 elif c == '\\':
253 p = peek()
276 p = peek()
254 if p:
277 if p:
255 i += 1
278 i += 1
256 res += escape(p)
279 res += escape(p)
257 else:
280 else:
258 res += escape(c)
281 res += escape(c)
259 else:
282 else:
260 res += escape(c)
283 res += escape(c)
261 return res
284 return res
262
285
263 def _regex(kind, name, tail):
286 def _regex(kind, pat, globsuffix):
264 '''convert a pattern into a regular expression'''
287 '''Convert a (normalized) pattern of any kind into a regular expression.
265 if not name:
288 globsuffix is appended to the regexp of globs.'''
289 if not pat:
266 return ''
290 return ''
267 if kind == 're':
291 if kind == 're':
268 return name
292 return pat
269 elif kind == 'path':
293 if kind == 'path':
270 return '^' + re.escape(name) + '(?:/|$)'
294 return '^' + re.escape(pat) + '(?:/|$)'
271 elif kind == 'relglob':
295 if kind == 'relglob':
272 return '(?:|.*/)' + _globre(name) + tail
296 return '(?:|.*/)' + _globre(pat) + globsuffix
273 elif kind == 'relpath':
297 if kind == 'relpath':
274 return re.escape(name) + '(?:/|$)'
298 return re.escape(pat) + '(?:/|$)'
275 elif kind == 'relre':
299 if kind == 'relre':
276 if name.startswith('^'):
300 if pat.startswith('^'):
277 return name
301 return pat
278 return '.*' + name
302 return '.*' + pat
279 return _globre(name) + tail
303 return _globre(pat) + globsuffix
280
304
281 def _buildmatch(ctx, pats, tail):
305 def _buildmatch(ctx, kindpats, globsuffix):
282 fset, pats = _expandsets(pats, ctx)
306 '''Return regexp string and a matcher function for kindpats.
283 if not pats:
307 globsuffix is appended to the regexp of globs.'''
308 fset, kindpats = _expandsets(kindpats, ctx)
309 if not kindpats:
284 return "", fset.__contains__
310 return "", fset.__contains__
285
311
286 pat, mf = _buildregexmatch(pats, tail)
312 regex, mf = _buildregexmatch(kindpats, globsuffix)
287 if fset:
313 if fset:
288 return pat, lambda f: f in fset or mf(f)
314 return regex, lambda f: f in fset or mf(f)
289 return pat, mf
315 return regex, mf
290
316
291 def _buildregexmatch(pats, tail):
317 def _buildregexmatch(kindpats, globsuffix):
292 """build a matching function from a set of patterns"""
318 """Build a match function from a list of kinds and kindpats,
319 return regexp string and a matcher function."""
293 try:
320 try:
294 pat = '(?:%s)' % '|'.join([_regex(k, p, tail) for (k, p) in pats])
321 regex = '(?:%s)' % '|'.join([_regex(k, p, globsuffix)
295 if len(pat) > 20000:
322 for (k, p) in kindpats])
323 if len(regex) > 20000:
296 raise OverflowError
324 raise OverflowError
297 return pat, _rematcher(pat)
325 return regex, _rematcher(regex)
298 except OverflowError:
326 except OverflowError:
299 # We're using a Python with a tiny regex engine and we
327 # We're using a Python with a tiny regex engine and we
300 # made it explode, so we'll divide the pattern list in two
328 # made it explode, so we'll divide the pattern list in two
301 # until it works
329 # until it works
302 l = len(pats)
330 l = len(kindpats)
303 if l < 2:
331 if l < 2:
304 raise
332 raise
305 pata, a = _buildregexmatch(pats[:l//2], tail)
333 regexa, a = _buildregexmatch(kindpats[:l//2], globsuffix)
306 patb, b = _buildregexmatch(pats[l//2:], tail)
334 regexb, b = _buildregexmatch(kindpats[l//2:], globsuffix)
307 return pat, lambda s: a(s) or b(s)
335 return pat, lambda s: a(s) or b(s)
308 except re.error:
336 except re.error:
309 for k, p in pats:
337 for k, p in kindpats:
310 try:
338 try:
311 _rematcher('(?:%s)' % _regex(k, p, tail))
339 _rematcher('(?:%s)' % _regex(k, p, globsuffix))
312 except re.error:
340 except re.error:
313 raise util.Abort(_("invalid pattern (%s): %s") % (k, p))
341 raise util.Abort(_("invalid pattern (%s): %s") % (k, p))
314 raise util.Abort(_("invalid pattern"))
342 raise util.Abort(_("invalid pattern"))
315
343
316 def _normalize(names, default, root, cwd, auditor):
344 def _normalize(patterns, default, root, cwd, auditor):
317 pats = []
345 '''Convert 'kind:pat' from the patterns list to tuples with kind and
318 for kind, name in [_patsplit(p, default) for p in names]:
346 normalized and rooted patterns and with listfiles expanded.'''
347 kindpats = []
348 for kind, pat in [_patsplit(p, default) for p in patterns]:
319 if kind in ('glob', 'relpath'):
349 if kind in ('glob', 'relpath'):
320 name = pathutil.canonpath(root, cwd, name, auditor)
350 pat = pathutil.canonpath(root, cwd, pat, auditor)
321 elif kind in ('relglob', 'path'):
351 elif kind in ('relglob', 'path'):
322 name = util.normpath(name)
352 pat = util.normpath(pat)
323 elif kind in ('listfile', 'listfile0'):
353 elif kind in ('listfile', 'listfile0'):
324 try:
354 try:
325 files = util.readfile(name)
355 files = util.readfile(pat)
326 if kind == 'listfile0':
356 if kind == 'listfile0':
327 files = files.split('\0')
357 files = files.split('\0')
328 else:
358 else:
329 files = files.splitlines()
359 files = files.splitlines()
330 files = [f for f in files if f]
360 files = [f for f in files if f]
331 except EnvironmentError:
361 except EnvironmentError:
332 raise util.Abort(_("unable to read file list (%s)") % name)
362 raise util.Abort(_("unable to read file list (%s)") % pat)
333 pats += _normalize(files, default, root, cwd, auditor)
363 kindpats += _normalize(files, default, root, cwd, auditor)
334 continue
364 continue
365 # else: re or relre - which cannot be normalized
366 kindpats.append((kind, pat))
367 return kindpats
335
368
336 pats.append((kind, name))
369 def _roots(kindpats):
337 return pats
338
339 def _roots(patterns):
340 '''return roots and exact explicitly listed files from patterns
370 '''return roots and exact explicitly listed files from patterns
341
371
342 >>> _roots([('glob', 'g/*'), ('glob', 'g'), ('glob', 'g*')])
372 >>> _roots([('glob', 'g/*'), ('glob', 'g'), ('glob', 'g*')])
343 ['g', 'g', '.']
373 ['g', 'g', '.']
344 >>> _roots([('relpath', 'r'), ('path', 'p/p'), ('path', '')])
374 >>> _roots([('relpath', 'r'), ('path', 'p/p'), ('path', '')])
345 ['r', 'p/p', '.']
375 ['r', 'p/p', '.']
346 >>> _roots([('relglob', 'rg*'), ('re', 're/'), ('relre', 'rr')])
376 >>> _roots([('relglob', 'rg*'), ('re', 're/'), ('relre', 'rr')])
347 ['.', '.', '.']
377 ['.', '.', '.']
348 '''
378 '''
349 r = []
379 r = []
350 for kind, name in patterns:
380 for kind, pat in kindpats:
351 if kind == 'glob': # find the non-glob prefix
381 if kind == 'glob': # find the non-glob prefix
352 root = []
382 root = []
353 for p in name.split('/'):
383 for p in pat.split('/'):
354 if '[' in p or '{' in p or '*' in p or '?' in p:
384 if '[' in p or '{' in p or '*' in p or '?' in p:
355 break
385 break
356 root.append(p)
386 root.append(p)
357 r.append('/'.join(root) or '.')
387 r.append('/'.join(root) or '.')
358 elif kind in ('relpath', 'path'):
388 elif kind in ('relpath', 'path'):
359 r.append(name or '.')
389 r.append(pat or '.')
360 else: # relglob, re, relre
390 else: # relglob, re, relre
361 r.append('.')
391 r.append('.')
362 return r
392 return r
363
393
364 def _anypats(patterns):
394 def _anypats(kindpats):
365 for kind, name in patterns:
395 for kind, pat in kindpats:
366 if kind in ('glob', 're', 'relglob', 'relre', 'set'):
396 if kind in ('glob', 're', 'relglob', 'relre', 'set'):
367 return True
397 return True
@@ -1,954 +1,961 b''
1 # scmutil.py - Mercurial core utility functions
1 # scmutil.py - Mercurial core utility functions
2 #
2 #
3 # Copyright Matt Mackall <mpm@selenic.com>
3 # Copyright Matt Mackall <mpm@selenic.com>
4 #
4 #
5 # This software may be used and distributed according to the terms of the
5 # This software may be used and distributed according to the terms of the
6 # GNU General Public License version 2 or any later version.
6 # GNU General Public License version 2 or any later version.
7
7
8 from i18n import _
8 from i18n import _
9 from mercurial.node import nullrev
9 from mercurial.node import nullrev
10 import util, error, osutil, revset, similar, encoding, phases, parsers
10 import util, error, osutil, revset, similar, encoding, phases, parsers
11 import pathutil
11 import pathutil
12 import match as matchmod
12 import match as matchmod
13 import os, errno, re, glob, tempfile
13 import os, errno, re, glob, tempfile
14
14
15 if os.name == 'nt':
15 if os.name == 'nt':
16 import scmwindows as scmplatform
16 import scmwindows as scmplatform
17 else:
17 else:
18 import scmposix as scmplatform
18 import scmposix as scmplatform
19
19
20 systemrcpath = scmplatform.systemrcpath
20 systemrcpath = scmplatform.systemrcpath
21 userrcpath = scmplatform.userrcpath
21 userrcpath = scmplatform.userrcpath
22
22
23 def itersubrepos(ctx1, ctx2):
23 def itersubrepos(ctx1, ctx2):
24 """find subrepos in ctx1 or ctx2"""
24 """find subrepos in ctx1 or ctx2"""
25 # Create a (subpath, ctx) mapping where we prefer subpaths from
25 # Create a (subpath, ctx) mapping where we prefer subpaths from
26 # ctx1. The subpaths from ctx2 are important when the .hgsub file
26 # ctx1. The subpaths from ctx2 are important when the .hgsub file
27 # has been modified (in ctx2) but not yet committed (in ctx1).
27 # has been modified (in ctx2) but not yet committed (in ctx1).
28 subpaths = dict.fromkeys(ctx2.substate, ctx2)
28 subpaths = dict.fromkeys(ctx2.substate, ctx2)
29 subpaths.update(dict.fromkeys(ctx1.substate, ctx1))
29 subpaths.update(dict.fromkeys(ctx1.substate, ctx1))
30 for subpath, ctx in sorted(subpaths.iteritems()):
30 for subpath, ctx in sorted(subpaths.iteritems()):
31 yield subpath, ctx.sub(subpath)
31 yield subpath, ctx.sub(subpath)
32
32
33 def nochangesfound(ui, repo, excluded=None):
33 def nochangesfound(ui, repo, excluded=None):
34 '''Report no changes for push/pull, excluded is None or a list of
34 '''Report no changes for push/pull, excluded is None or a list of
35 nodes excluded from the push/pull.
35 nodes excluded from the push/pull.
36 '''
36 '''
37 secretlist = []
37 secretlist = []
38 if excluded:
38 if excluded:
39 for n in excluded:
39 for n in excluded:
40 if n not in repo:
40 if n not in repo:
41 # discovery should not have included the filtered revision,
41 # discovery should not have included the filtered revision,
42 # we have to explicitly exclude it until discovery is cleanup.
42 # we have to explicitly exclude it until discovery is cleanup.
43 continue
43 continue
44 ctx = repo[n]
44 ctx = repo[n]
45 if ctx.phase() >= phases.secret and not ctx.extinct():
45 if ctx.phase() >= phases.secret and not ctx.extinct():
46 secretlist.append(n)
46 secretlist.append(n)
47
47
48 if secretlist:
48 if secretlist:
49 ui.status(_("no changes found (ignored %d secret changesets)\n")
49 ui.status(_("no changes found (ignored %d secret changesets)\n")
50 % len(secretlist))
50 % len(secretlist))
51 else:
51 else:
52 ui.status(_("no changes found\n"))
52 ui.status(_("no changes found\n"))
53
53
54 def checknewlabel(repo, lbl, kind):
54 def checknewlabel(repo, lbl, kind):
55 # Do not use the "kind" parameter in ui output.
55 # Do not use the "kind" parameter in ui output.
56 # It makes strings difficult to translate.
56 # It makes strings difficult to translate.
57 if lbl in ['tip', '.', 'null']:
57 if lbl in ['tip', '.', 'null']:
58 raise util.Abort(_("the name '%s' is reserved") % lbl)
58 raise util.Abort(_("the name '%s' is reserved") % lbl)
59 for c in (':', '\0', '\n', '\r'):
59 for c in (':', '\0', '\n', '\r'):
60 if c in lbl:
60 if c in lbl:
61 raise util.Abort(_("%r cannot be used in a name") % c)
61 raise util.Abort(_("%r cannot be used in a name") % c)
62 try:
62 try:
63 int(lbl)
63 int(lbl)
64 raise util.Abort(_("cannot use an integer as a name"))
64 raise util.Abort(_("cannot use an integer as a name"))
65 except ValueError:
65 except ValueError:
66 pass
66 pass
67
67
68 def checkfilename(f):
68 def checkfilename(f):
69 '''Check that the filename f is an acceptable filename for a tracked file'''
69 '''Check that the filename f is an acceptable filename for a tracked file'''
70 if '\r' in f or '\n' in f:
70 if '\r' in f or '\n' in f:
71 raise util.Abort(_("'\\n' and '\\r' disallowed in filenames: %r") % f)
71 raise util.Abort(_("'\\n' and '\\r' disallowed in filenames: %r") % f)
72
72
73 def checkportable(ui, f):
73 def checkportable(ui, f):
74 '''Check if filename f is portable and warn or abort depending on config'''
74 '''Check if filename f is portable and warn or abort depending on config'''
75 checkfilename(f)
75 checkfilename(f)
76 abort, warn = checkportabilityalert(ui)
76 abort, warn = checkportabilityalert(ui)
77 if abort or warn:
77 if abort or warn:
78 msg = util.checkwinfilename(f)
78 msg = util.checkwinfilename(f)
79 if msg:
79 if msg:
80 msg = "%s: %r" % (msg, f)
80 msg = "%s: %r" % (msg, f)
81 if abort:
81 if abort:
82 raise util.Abort(msg)
82 raise util.Abort(msg)
83 ui.warn(_("warning: %s\n") % msg)
83 ui.warn(_("warning: %s\n") % msg)
84
84
85 def checkportabilityalert(ui):
85 def checkportabilityalert(ui):
86 '''check if the user's config requests nothing, a warning, or abort for
86 '''check if the user's config requests nothing, a warning, or abort for
87 non-portable filenames'''
87 non-portable filenames'''
88 val = ui.config('ui', 'portablefilenames', 'warn')
88 val = ui.config('ui', 'portablefilenames', 'warn')
89 lval = val.lower()
89 lval = val.lower()
90 bval = util.parsebool(val)
90 bval = util.parsebool(val)
91 abort = os.name == 'nt' or lval == 'abort'
91 abort = os.name == 'nt' or lval == 'abort'
92 warn = bval or lval == 'warn'
92 warn = bval or lval == 'warn'
93 if bval is None and not (warn or abort or lval == 'ignore'):
93 if bval is None and not (warn or abort or lval == 'ignore'):
94 raise error.ConfigError(
94 raise error.ConfigError(
95 _("ui.portablefilenames value is invalid ('%s')") % val)
95 _("ui.portablefilenames value is invalid ('%s')") % val)
96 return abort, warn
96 return abort, warn
97
97
98 class casecollisionauditor(object):
98 class casecollisionauditor(object):
99 def __init__(self, ui, abort, dirstate):
99 def __init__(self, ui, abort, dirstate):
100 self._ui = ui
100 self._ui = ui
101 self._abort = abort
101 self._abort = abort
102 allfiles = '\0'.join(dirstate._map)
102 allfiles = '\0'.join(dirstate._map)
103 self._loweredfiles = set(encoding.lower(allfiles).split('\0'))
103 self._loweredfiles = set(encoding.lower(allfiles).split('\0'))
104 self._dirstate = dirstate
104 self._dirstate = dirstate
105 # The purpose of _newfiles is so that we don't complain about
105 # The purpose of _newfiles is so that we don't complain about
106 # case collisions if someone were to call this object with the
106 # case collisions if someone were to call this object with the
107 # same filename twice.
107 # same filename twice.
108 self._newfiles = set()
108 self._newfiles = set()
109
109
110 def __call__(self, f):
110 def __call__(self, f):
111 if f in self._newfiles:
111 if f in self._newfiles:
112 return
112 return
113 fl = encoding.lower(f)
113 fl = encoding.lower(f)
114 if fl in self._loweredfiles and f not in self._dirstate:
114 if fl in self._loweredfiles and f not in self._dirstate:
115 msg = _('possible case-folding collision for %s') % f
115 msg = _('possible case-folding collision for %s') % f
116 if self._abort:
116 if self._abort:
117 raise util.Abort(msg)
117 raise util.Abort(msg)
118 self._ui.warn(_("warning: %s\n") % msg)
118 self._ui.warn(_("warning: %s\n") % msg)
119 self._loweredfiles.add(fl)
119 self._loweredfiles.add(fl)
120 self._newfiles.add(f)
120 self._newfiles.add(f)
121
121
122 class abstractvfs(object):
122 class abstractvfs(object):
123 """Abstract base class; cannot be instantiated"""
123 """Abstract base class; cannot be instantiated"""
124
124
125 def __init__(self, *args, **kwargs):
125 def __init__(self, *args, **kwargs):
126 '''Prevent instantiation; don't call this from subclasses.'''
126 '''Prevent instantiation; don't call this from subclasses.'''
127 raise NotImplementedError('attempted instantiating ' + str(type(self)))
127 raise NotImplementedError('attempted instantiating ' + str(type(self)))
128
128
129 def tryread(self, path):
129 def tryread(self, path):
130 '''gracefully return an empty string for missing files'''
130 '''gracefully return an empty string for missing files'''
131 try:
131 try:
132 return self.read(path)
132 return self.read(path)
133 except IOError, inst:
133 except IOError, inst:
134 if inst.errno != errno.ENOENT:
134 if inst.errno != errno.ENOENT:
135 raise
135 raise
136 return ""
136 return ""
137
137
138 def open(self, path, mode="r", text=False, atomictemp=False):
138 def open(self, path, mode="r", text=False, atomictemp=False):
139 self.open = self.__call__
139 self.open = self.__call__
140 return self.__call__(path, mode, text, atomictemp)
140 return self.__call__(path, mode, text, atomictemp)
141
141
142 def read(self, path):
142 def read(self, path):
143 fp = self(path, 'rb')
143 fp = self(path, 'rb')
144 try:
144 try:
145 return fp.read()
145 return fp.read()
146 finally:
146 finally:
147 fp.close()
147 fp.close()
148
148
149 def write(self, path, data):
149 def write(self, path, data):
150 fp = self(path, 'wb')
150 fp = self(path, 'wb')
151 try:
151 try:
152 return fp.write(data)
152 return fp.write(data)
153 finally:
153 finally:
154 fp.close()
154 fp.close()
155
155
156 def append(self, path, data):
156 def append(self, path, data):
157 fp = self(path, 'ab')
157 fp = self(path, 'ab')
158 try:
158 try:
159 return fp.write(data)
159 return fp.write(data)
160 finally:
160 finally:
161 fp.close()
161 fp.close()
162
162
163 def chmod(self, path, mode):
163 def chmod(self, path, mode):
164 return os.chmod(self.join(path), mode)
164 return os.chmod(self.join(path), mode)
165
165
166 def exists(self, path=None):
166 def exists(self, path=None):
167 return os.path.exists(self.join(path))
167 return os.path.exists(self.join(path))
168
168
169 def fstat(self, fp):
169 def fstat(self, fp):
170 return util.fstat(fp)
170 return util.fstat(fp)
171
171
172 def isdir(self, path=None):
172 def isdir(self, path=None):
173 return os.path.isdir(self.join(path))
173 return os.path.isdir(self.join(path))
174
174
175 def isfile(self, path=None):
175 def isfile(self, path=None):
176 return os.path.isfile(self.join(path))
176 return os.path.isfile(self.join(path))
177
177
178 def islink(self, path=None):
178 def islink(self, path=None):
179 return os.path.islink(self.join(path))
179 return os.path.islink(self.join(path))
180
180
181 def lstat(self, path=None):
181 def lstat(self, path=None):
182 return os.lstat(self.join(path))
182 return os.lstat(self.join(path))
183
183
184 def makedir(self, path=None, notindexed=True):
184 def makedir(self, path=None, notindexed=True):
185 return util.makedir(self.join(path), notindexed)
185 return util.makedir(self.join(path), notindexed)
186
186
187 def makedirs(self, path=None, mode=None):
187 def makedirs(self, path=None, mode=None):
188 return util.makedirs(self.join(path), mode)
188 return util.makedirs(self.join(path), mode)
189
189
190 def makelock(self, info, path):
190 def makelock(self, info, path):
191 return util.makelock(info, self.join(path))
191 return util.makelock(info, self.join(path))
192
192
193 def mkdir(self, path=None):
193 def mkdir(self, path=None):
194 return os.mkdir(self.join(path))
194 return os.mkdir(self.join(path))
195
195
196 def mkstemp(self, suffix='', prefix='tmp', dir=None, text=False):
196 def mkstemp(self, suffix='', prefix='tmp', dir=None, text=False):
197 fd, name = tempfile.mkstemp(suffix=suffix, prefix=prefix,
197 fd, name = tempfile.mkstemp(suffix=suffix, prefix=prefix,
198 dir=self.join(dir), text=text)
198 dir=self.join(dir), text=text)
199 dname, fname = util.split(name)
199 dname, fname = util.split(name)
200 if dir:
200 if dir:
201 return fd, os.path.join(dir, fname)
201 return fd, os.path.join(dir, fname)
202 else:
202 else:
203 return fd, fname
203 return fd, fname
204
204
205 def readdir(self, path=None, stat=None, skip=None):
205 def readdir(self, path=None, stat=None, skip=None):
206 return osutil.listdir(self.join(path), stat, skip)
206 return osutil.listdir(self.join(path), stat, skip)
207
207
208 def readlock(self, path):
208 def readlock(self, path):
209 return util.readlock(self.join(path))
209 return util.readlock(self.join(path))
210
210
211 def rename(self, src, dst):
211 def rename(self, src, dst):
212 return util.rename(self.join(src), self.join(dst))
212 return util.rename(self.join(src), self.join(dst))
213
213
214 def readlink(self, path):
214 def readlink(self, path):
215 return os.readlink(self.join(path))
215 return os.readlink(self.join(path))
216
216
217 def setflags(self, path, l, x):
217 def setflags(self, path, l, x):
218 return util.setflags(self.join(path), l, x)
218 return util.setflags(self.join(path), l, x)
219
219
220 def stat(self, path=None):
220 def stat(self, path=None):
221 return os.stat(self.join(path))
221 return os.stat(self.join(path))
222
222
223 def unlink(self, path=None):
223 def unlink(self, path=None):
224 return util.unlink(self.join(path))
224 return util.unlink(self.join(path))
225
225
226 def utime(self, path=None, t=None):
226 def utime(self, path=None, t=None):
227 return os.utime(self.join(path), t)
227 return os.utime(self.join(path), t)
228
228
229 class vfs(abstractvfs):
229 class vfs(abstractvfs):
230 '''Operate files relative to a base directory
230 '''Operate files relative to a base directory
231
231
232 This class is used to hide the details of COW semantics and
232 This class is used to hide the details of COW semantics and
233 remote file access from higher level code.
233 remote file access from higher level code.
234 '''
234 '''
235 def __init__(self, base, audit=True, expandpath=False, realpath=False):
235 def __init__(self, base, audit=True, expandpath=False, realpath=False):
236 if expandpath:
236 if expandpath:
237 base = util.expandpath(base)
237 base = util.expandpath(base)
238 if realpath:
238 if realpath:
239 base = os.path.realpath(base)
239 base = os.path.realpath(base)
240 self.base = base
240 self.base = base
241 self._setmustaudit(audit)
241 self._setmustaudit(audit)
242 self.createmode = None
242 self.createmode = None
243 self._trustnlink = None
243 self._trustnlink = None
244
244
245 def _getmustaudit(self):
245 def _getmustaudit(self):
246 return self._audit
246 return self._audit
247
247
248 def _setmustaudit(self, onoff):
248 def _setmustaudit(self, onoff):
249 self._audit = onoff
249 self._audit = onoff
250 if onoff:
250 if onoff:
251 self.audit = pathutil.pathauditor(self.base)
251 self.audit = pathutil.pathauditor(self.base)
252 else:
252 else:
253 self.audit = util.always
253 self.audit = util.always
254
254
255 mustaudit = property(_getmustaudit, _setmustaudit)
255 mustaudit = property(_getmustaudit, _setmustaudit)
256
256
257 @util.propertycache
257 @util.propertycache
258 def _cansymlink(self):
258 def _cansymlink(self):
259 return util.checklink(self.base)
259 return util.checklink(self.base)
260
260
261 @util.propertycache
261 @util.propertycache
262 def _chmod(self):
262 def _chmod(self):
263 return util.checkexec(self.base)
263 return util.checkexec(self.base)
264
264
265 def _fixfilemode(self, name):
265 def _fixfilemode(self, name):
266 if self.createmode is None or not self._chmod:
266 if self.createmode is None or not self._chmod:
267 return
267 return
268 os.chmod(name, self.createmode & 0666)
268 os.chmod(name, self.createmode & 0666)
269
269
270 def __call__(self, path, mode="r", text=False, atomictemp=False):
270 def __call__(self, path, mode="r", text=False, atomictemp=False):
271 if self._audit:
271 if self._audit:
272 r = util.checkosfilename(path)
272 r = util.checkosfilename(path)
273 if r:
273 if r:
274 raise util.Abort("%s: %r" % (r, path))
274 raise util.Abort("%s: %r" % (r, path))
275 self.audit(path)
275 self.audit(path)
276 f = self.join(path)
276 f = self.join(path)
277
277
278 if not text and "b" not in mode:
278 if not text and "b" not in mode:
279 mode += "b" # for that other OS
279 mode += "b" # for that other OS
280
280
281 nlink = -1
281 nlink = -1
282 if mode not in ('r', 'rb'):
282 if mode not in ('r', 'rb'):
283 dirname, basename = util.split(f)
283 dirname, basename = util.split(f)
284 # If basename is empty, then the path is malformed because it points
284 # If basename is empty, then the path is malformed because it points
285 # to a directory. Let the posixfile() call below raise IOError.
285 # to a directory. Let the posixfile() call below raise IOError.
286 if basename:
286 if basename:
287 if atomictemp:
287 if atomictemp:
288 util.ensuredirs(dirname, self.createmode)
288 util.ensuredirs(dirname, self.createmode)
289 return util.atomictempfile(f, mode, self.createmode)
289 return util.atomictempfile(f, mode, self.createmode)
290 try:
290 try:
291 if 'w' in mode:
291 if 'w' in mode:
292 util.unlink(f)
292 util.unlink(f)
293 nlink = 0
293 nlink = 0
294 else:
294 else:
295 # nlinks() may behave differently for files on Windows
295 # nlinks() may behave differently for files on Windows
296 # shares if the file is open.
296 # shares if the file is open.
297 fd = util.posixfile(f)
297 fd = util.posixfile(f)
298 nlink = util.nlinks(f)
298 nlink = util.nlinks(f)
299 if nlink < 1:
299 if nlink < 1:
300 nlink = 2 # force mktempcopy (issue1922)
300 nlink = 2 # force mktempcopy (issue1922)
301 fd.close()
301 fd.close()
302 except (OSError, IOError), e:
302 except (OSError, IOError), e:
303 if e.errno != errno.ENOENT:
303 if e.errno != errno.ENOENT:
304 raise
304 raise
305 nlink = 0
305 nlink = 0
306 util.ensuredirs(dirname, self.createmode)
306 util.ensuredirs(dirname, self.createmode)
307 if nlink > 0:
307 if nlink > 0:
308 if self._trustnlink is None:
308 if self._trustnlink is None:
309 self._trustnlink = nlink > 1 or util.checknlink(f)
309 self._trustnlink = nlink > 1 or util.checknlink(f)
310 if nlink > 1 or not self._trustnlink:
310 if nlink > 1 or not self._trustnlink:
311 util.rename(util.mktempcopy(f), f)
311 util.rename(util.mktempcopy(f), f)
312 fp = util.posixfile(f, mode)
312 fp = util.posixfile(f, mode)
313 if nlink == 0:
313 if nlink == 0:
314 self._fixfilemode(f)
314 self._fixfilemode(f)
315 return fp
315 return fp
316
316
317 def symlink(self, src, dst):
317 def symlink(self, src, dst):
318 self.audit(dst)
318 self.audit(dst)
319 linkname = self.join(dst)
319 linkname = self.join(dst)
320 try:
320 try:
321 os.unlink(linkname)
321 os.unlink(linkname)
322 except OSError:
322 except OSError:
323 pass
323 pass
324
324
325 util.ensuredirs(os.path.dirname(linkname), self.createmode)
325 util.ensuredirs(os.path.dirname(linkname), self.createmode)
326
326
327 if self._cansymlink:
327 if self._cansymlink:
328 try:
328 try:
329 os.symlink(src, linkname)
329 os.symlink(src, linkname)
330 except OSError, err:
330 except OSError, err:
331 raise OSError(err.errno, _('could not symlink to %r: %s') %
331 raise OSError(err.errno, _('could not symlink to %r: %s') %
332 (src, err.strerror), linkname)
332 (src, err.strerror), linkname)
333 else:
333 else:
334 self.write(dst, src)
334 self.write(dst, src)
335
335
336 def join(self, path):
336 def join(self, path):
337 if path:
337 if path:
338 return os.path.join(self.base, path)
338 return os.path.join(self.base, path)
339 else:
339 else:
340 return self.base
340 return self.base
341
341
342 opener = vfs
342 opener = vfs
343
343
344 class auditvfs(object):
344 class auditvfs(object):
345 def __init__(self, vfs):
345 def __init__(self, vfs):
346 self.vfs = vfs
346 self.vfs = vfs
347
347
348 def _getmustaudit(self):
348 def _getmustaudit(self):
349 return self.vfs.mustaudit
349 return self.vfs.mustaudit
350
350
351 def _setmustaudit(self, onoff):
351 def _setmustaudit(self, onoff):
352 self.vfs.mustaudit = onoff
352 self.vfs.mustaudit = onoff
353
353
354 mustaudit = property(_getmustaudit, _setmustaudit)
354 mustaudit = property(_getmustaudit, _setmustaudit)
355
355
356 class filtervfs(abstractvfs, auditvfs):
356 class filtervfs(abstractvfs, auditvfs):
357 '''Wrapper vfs for filtering filenames with a function.'''
357 '''Wrapper vfs for filtering filenames with a function.'''
358
358
359 def __init__(self, vfs, filter):
359 def __init__(self, vfs, filter):
360 auditvfs.__init__(self, vfs)
360 auditvfs.__init__(self, vfs)
361 self._filter = filter
361 self._filter = filter
362
362
363 def __call__(self, path, *args, **kwargs):
363 def __call__(self, path, *args, **kwargs):
364 return self.vfs(self._filter(path), *args, **kwargs)
364 return self.vfs(self._filter(path), *args, **kwargs)
365
365
366 def join(self, path):
366 def join(self, path):
367 if path:
367 if path:
368 return self.vfs.join(self._filter(path))
368 return self.vfs.join(self._filter(path))
369 else:
369 else:
370 return self.vfs.join(path)
370 return self.vfs.join(path)
371
371
372 filteropener = filtervfs
372 filteropener = filtervfs
373
373
374 class readonlyvfs(abstractvfs, auditvfs):
374 class readonlyvfs(abstractvfs, auditvfs):
375 '''Wrapper vfs preventing any writing.'''
375 '''Wrapper vfs preventing any writing.'''
376
376
377 def __init__(self, vfs):
377 def __init__(self, vfs):
378 auditvfs.__init__(self, vfs)
378 auditvfs.__init__(self, vfs)
379
379
380 def __call__(self, path, mode='r', *args, **kw):
380 def __call__(self, path, mode='r', *args, **kw):
381 if mode not in ('r', 'rb'):
381 if mode not in ('r', 'rb'):
382 raise util.Abort('this vfs is read only')
382 raise util.Abort('this vfs is read only')
383 return self.vfs(path, mode, *args, **kw)
383 return self.vfs(path, mode, *args, **kw)
384
384
385
385
386 def walkrepos(path, followsym=False, seen_dirs=None, recurse=False):
386 def walkrepos(path, followsym=False, seen_dirs=None, recurse=False):
387 '''yield every hg repository under path, always recursively.
387 '''yield every hg repository under path, always recursively.
388 The recurse flag will only control recursion into repo working dirs'''
388 The recurse flag will only control recursion into repo working dirs'''
389 def errhandler(err):
389 def errhandler(err):
390 if err.filename == path:
390 if err.filename == path:
391 raise err
391 raise err
392 samestat = getattr(os.path, 'samestat', None)
392 samestat = getattr(os.path, 'samestat', None)
393 if followsym and samestat is not None:
393 if followsym and samestat is not None:
394 def adddir(dirlst, dirname):
394 def adddir(dirlst, dirname):
395 match = False
395 match = False
396 dirstat = os.stat(dirname)
396 dirstat = os.stat(dirname)
397 for lstdirstat in dirlst:
397 for lstdirstat in dirlst:
398 if samestat(dirstat, lstdirstat):
398 if samestat(dirstat, lstdirstat):
399 match = True
399 match = True
400 break
400 break
401 if not match:
401 if not match:
402 dirlst.append(dirstat)
402 dirlst.append(dirstat)
403 return not match
403 return not match
404 else:
404 else:
405 followsym = False
405 followsym = False
406
406
407 if (seen_dirs is None) and followsym:
407 if (seen_dirs is None) and followsym:
408 seen_dirs = []
408 seen_dirs = []
409 adddir(seen_dirs, path)
409 adddir(seen_dirs, path)
410 for root, dirs, files in os.walk(path, topdown=True, onerror=errhandler):
410 for root, dirs, files in os.walk(path, topdown=True, onerror=errhandler):
411 dirs.sort()
411 dirs.sort()
412 if '.hg' in dirs:
412 if '.hg' in dirs:
413 yield root # found a repository
413 yield root # found a repository
414 qroot = os.path.join(root, '.hg', 'patches')
414 qroot = os.path.join(root, '.hg', 'patches')
415 if os.path.isdir(os.path.join(qroot, '.hg')):
415 if os.path.isdir(os.path.join(qroot, '.hg')):
416 yield qroot # we have a patch queue repo here
416 yield qroot # we have a patch queue repo here
417 if recurse:
417 if recurse:
418 # avoid recursing inside the .hg directory
418 # avoid recursing inside the .hg directory
419 dirs.remove('.hg')
419 dirs.remove('.hg')
420 else:
420 else:
421 dirs[:] = [] # don't descend further
421 dirs[:] = [] # don't descend further
422 elif followsym:
422 elif followsym:
423 newdirs = []
423 newdirs = []
424 for d in dirs:
424 for d in dirs:
425 fname = os.path.join(root, d)
425 fname = os.path.join(root, d)
426 if adddir(seen_dirs, fname):
426 if adddir(seen_dirs, fname):
427 if os.path.islink(fname):
427 if os.path.islink(fname):
428 for hgname in walkrepos(fname, True, seen_dirs):
428 for hgname in walkrepos(fname, True, seen_dirs):
429 yield hgname
429 yield hgname
430 else:
430 else:
431 newdirs.append(d)
431 newdirs.append(d)
432 dirs[:] = newdirs
432 dirs[:] = newdirs
433
433
434 def osrcpath():
434 def osrcpath():
435 '''return default os-specific hgrc search path'''
435 '''return default os-specific hgrc search path'''
436 path = systemrcpath()
436 path = systemrcpath()
437 path.extend(userrcpath())
437 path.extend(userrcpath())
438 path = [os.path.normpath(f) for f in path]
438 path = [os.path.normpath(f) for f in path]
439 return path
439 return path
440
440
441 _rcpath = None
441 _rcpath = None
442
442
443 def rcpath():
443 def rcpath():
444 '''return hgrc search path. if env var HGRCPATH is set, use it.
444 '''return hgrc search path. if env var HGRCPATH is set, use it.
445 for each item in path, if directory, use files ending in .rc,
445 for each item in path, if directory, use files ending in .rc,
446 else use item.
446 else use item.
447 make HGRCPATH empty to only look in .hg/hgrc of current repo.
447 make HGRCPATH empty to only look in .hg/hgrc of current repo.
448 if no HGRCPATH, use default os-specific path.'''
448 if no HGRCPATH, use default os-specific path.'''
449 global _rcpath
449 global _rcpath
450 if _rcpath is None:
450 if _rcpath is None:
451 if 'HGRCPATH' in os.environ:
451 if 'HGRCPATH' in os.environ:
452 _rcpath = []
452 _rcpath = []
453 for p in os.environ['HGRCPATH'].split(os.pathsep):
453 for p in os.environ['HGRCPATH'].split(os.pathsep):
454 if not p:
454 if not p:
455 continue
455 continue
456 p = util.expandpath(p)
456 p = util.expandpath(p)
457 if os.path.isdir(p):
457 if os.path.isdir(p):
458 for f, kind in osutil.listdir(p):
458 for f, kind in osutil.listdir(p):
459 if f.endswith('.rc'):
459 if f.endswith('.rc'):
460 _rcpath.append(os.path.join(p, f))
460 _rcpath.append(os.path.join(p, f))
461 else:
461 else:
462 _rcpath.append(p)
462 _rcpath.append(p)
463 else:
463 else:
464 _rcpath = osrcpath()
464 _rcpath = osrcpath()
465 return _rcpath
465 return _rcpath
466
466
467 def revsingle(repo, revspec, default='.'):
467 def revsingle(repo, revspec, default='.'):
468 if not revspec and revspec != 0:
468 if not revspec and revspec != 0:
469 return repo[default]
469 return repo[default]
470
470
471 l = revrange(repo, [revspec])
471 l = revrange(repo, [revspec])
472 if len(l) < 1:
472 if len(l) < 1:
473 raise util.Abort(_('empty revision set'))
473 raise util.Abort(_('empty revision set'))
474 return repo[l[-1]]
474 return repo[l[-1]]
475
475
476 def revpair(repo, revs):
476 def revpair(repo, revs):
477 if not revs:
477 if not revs:
478 return repo.dirstate.p1(), None
478 return repo.dirstate.p1(), None
479
479
480 l = revrange(repo, revs)
480 l = revrange(repo, revs)
481
481
482 if not l:
482 if not l:
483 first = second = None
483 first = second = None
484 elif l.isascending():
484 elif l.isascending():
485 first = l.min()
485 first = l.min()
486 second = l.max()
486 second = l.max()
487 elif l.isdescending():
487 elif l.isdescending():
488 first = l.max()
488 first = l.max()
489 second = l.min()
489 second = l.min()
490 else:
490 else:
491 l = list(l)
491 l = list(l)
492 first = l[0]
492 first = l[0]
493 second = l[-1]
493 second = l[-1]
494
494
495 if first is None:
495 if first is None:
496 raise util.Abort(_('empty revision range'))
496 raise util.Abort(_('empty revision range'))
497
497
498 if first == second and len(revs) == 1 and _revrangesep not in revs[0]:
498 if first == second and len(revs) == 1 and _revrangesep not in revs[0]:
499 return repo.lookup(first), None
499 return repo.lookup(first), None
500
500
501 return repo.lookup(first), repo.lookup(second)
501 return repo.lookup(first), repo.lookup(second)
502
502
503 _revrangesep = ':'
503 _revrangesep = ':'
504
504
505 def revrange(repo, revs):
505 def revrange(repo, revs):
506 """Yield revision as strings from a list of revision specifications."""
506 """Yield revision as strings from a list of revision specifications."""
507
507
508 def revfix(repo, val, defval):
508 def revfix(repo, val, defval):
509 if not val and val != 0 and defval is not None:
509 if not val and val != 0 and defval is not None:
510 return defval
510 return defval
511 return repo[val].rev()
511 return repo[val].rev()
512
512
513 seen, l = set(), revset.baseset([])
513 seen, l = set(), revset.baseset([])
514 for spec in revs:
514 for spec in revs:
515 if l and not seen:
515 if l and not seen:
516 seen = set(l)
516 seen = set(l)
517 # attempt to parse old-style ranges first to deal with
517 # attempt to parse old-style ranges first to deal with
518 # things like old-tag which contain query metacharacters
518 # things like old-tag which contain query metacharacters
519 try:
519 try:
520 if isinstance(spec, int):
520 if isinstance(spec, int):
521 seen.add(spec)
521 seen.add(spec)
522 l = l + revset.baseset([spec])
522 l = l + revset.baseset([spec])
523 continue
523 continue
524
524
525 if _revrangesep in spec:
525 if _revrangesep in spec:
526 start, end = spec.split(_revrangesep, 1)
526 start, end = spec.split(_revrangesep, 1)
527 start = revfix(repo, start, 0)
527 start = revfix(repo, start, 0)
528 end = revfix(repo, end, len(repo) - 1)
528 end = revfix(repo, end, len(repo) - 1)
529 if end == nullrev and start < 0:
529 if end == nullrev and start < 0:
530 start = nullrev
530 start = nullrev
531 rangeiter = repo.changelog.revs(start, end)
531 rangeiter = repo.changelog.revs(start, end)
532 if not seen and not l:
532 if not seen and not l:
533 # by far the most common case: revs = ["-1:0"]
533 # by far the most common case: revs = ["-1:0"]
534 l = revset.baseset(rangeiter)
534 l = revset.baseset(rangeiter)
535 # defer syncing seen until next iteration
535 # defer syncing seen until next iteration
536 continue
536 continue
537 newrevs = set(rangeiter)
537 newrevs = set(rangeiter)
538 if seen:
538 if seen:
539 newrevs.difference_update(seen)
539 newrevs.difference_update(seen)
540 seen.update(newrevs)
540 seen.update(newrevs)
541 else:
541 else:
542 seen = newrevs
542 seen = newrevs
543 l = l + revset.baseset(sorted(newrevs, reverse=start > end))
543 l = l + revset.baseset(sorted(newrevs, reverse=start > end))
544 continue
544 continue
545 elif spec and spec in repo: # single unquoted rev
545 elif spec and spec in repo: # single unquoted rev
546 rev = revfix(repo, spec, None)
546 rev = revfix(repo, spec, None)
547 if rev in seen:
547 if rev in seen:
548 continue
548 continue
549 seen.add(rev)
549 seen.add(rev)
550 l = l + revset.baseset([rev])
550 l = l + revset.baseset([rev])
551 continue
551 continue
552 except error.RepoLookupError:
552 except error.RepoLookupError:
553 pass
553 pass
554
554
555 # fall through to new-style queries if old-style fails
555 # fall through to new-style queries if old-style fails
556 m = revset.match(repo.ui, spec, repo)
556 m = revset.match(repo.ui, spec, repo)
557 if seen or l:
557 if seen or l:
558 dl = [r for r in m(repo, revset.spanset(repo)) if r not in seen]
558 dl = [r for r in m(repo, revset.spanset(repo)) if r not in seen]
559 l = l + revset.baseset(dl)
559 l = l + revset.baseset(dl)
560 seen.update(dl)
560 seen.update(dl)
561 else:
561 else:
562 l = m(repo, revset.spanset(repo))
562 l = m(repo, revset.spanset(repo))
563
563
564 return l
564 return l
565
565
566 def expandpats(pats):
566 def expandpats(pats):
567 '''Expand bare globs when running on windows.
568 On posix we assume it already has already been done by sh.'''
567 if not util.expandglobs:
569 if not util.expandglobs:
568 return list(pats)
570 return list(pats)
569 ret = []
571 ret = []
570 for p in pats:
572 for kindpat in pats:
571 kind, name = matchmod._patsplit(p, None)
573 kind, pat = matchmod._patsplit(kindpat, None)
572 if kind is None:
574 if kind is None:
573 try:
575 try:
574 globbed = glob.glob(name)
576 globbed = glob.glob(pat)
575 except re.error:
577 except re.error:
576 globbed = [name]
578 globbed = [pat]
577 if globbed:
579 if globbed:
578 ret.extend(globbed)
580 ret.extend(globbed)
579 continue
581 continue
580 ret.append(p)
582 ret.append(kindpat)
581 return ret
583 return ret
582
584
583 def matchandpats(ctx, pats=[], opts={}, globbed=False, default='relpath'):
585 def matchandpats(ctx, pats=[], opts={}, globbed=False, default='relpath'):
586 '''Return a matcher and the patterns that were used.
587 The matcher will warn about bad matches.'''
584 if pats == ("",):
588 if pats == ("",):
585 pats = []
589 pats = []
586 if not globbed and default == 'relpath':
590 if not globbed and default == 'relpath':
587 pats = expandpats(pats or [])
591 pats = expandpats(pats or [])
588
592
589 m = ctx.match(pats, opts.get('include'), opts.get('exclude'),
593 m = ctx.match(pats, opts.get('include'), opts.get('exclude'),
590 default)
594 default)
591 def badfn(f, msg):
595 def badfn(f, msg):
592 ctx._repo.ui.warn("%s: %s\n" % (m.rel(f), msg))
596 ctx._repo.ui.warn("%s: %s\n" % (m.rel(f), msg))
593 m.bad = badfn
597 m.bad = badfn
594 return m, pats
598 return m, pats
595
599
596 def match(ctx, pats=[], opts={}, globbed=False, default='relpath'):
600 def match(ctx, pats=[], opts={}, globbed=False, default='relpath'):
601 '''Return a matcher that will warn about bad matches.'''
597 return matchandpats(ctx, pats, opts, globbed, default)[0]
602 return matchandpats(ctx, pats, opts, globbed, default)[0]
598
603
599 def matchall(repo):
604 def matchall(repo):
605 '''Return a matcher that will efficiently match everything.'''
600 return matchmod.always(repo.root, repo.getcwd())
606 return matchmod.always(repo.root, repo.getcwd())
601
607
602 def matchfiles(repo, files):
608 def matchfiles(repo, files):
609 '''Return a matcher that will efficiently match exactly these files.'''
603 return matchmod.exact(repo.root, repo.getcwd(), files)
610 return matchmod.exact(repo.root, repo.getcwd(), files)
604
611
605 def addremove(repo, pats=[], opts={}, dry_run=None, similarity=None):
612 def addremove(repo, pats=[], opts={}, dry_run=None, similarity=None):
606 if dry_run is None:
613 if dry_run is None:
607 dry_run = opts.get('dry_run')
614 dry_run = opts.get('dry_run')
608 if similarity is None:
615 if similarity is None:
609 similarity = float(opts.get('similarity') or 0)
616 similarity = float(opts.get('similarity') or 0)
610 # we'd use status here, except handling of symlinks and ignore is tricky
617 # we'd use status here, except handling of symlinks and ignore is tricky
611 m = match(repo[None], pats, opts)
618 m = match(repo[None], pats, opts)
612 rejected = []
619 rejected = []
613 m.bad = lambda x, y: rejected.append(x)
620 m.bad = lambda x, y: rejected.append(x)
614
621
615 added, unknown, deleted, removed = _interestingfiles(repo, m)
622 added, unknown, deleted, removed = _interestingfiles(repo, m)
616
623
617 unknownset = set(unknown)
624 unknownset = set(unknown)
618 toprint = unknownset.copy()
625 toprint = unknownset.copy()
619 toprint.update(deleted)
626 toprint.update(deleted)
620 for abs in sorted(toprint):
627 for abs in sorted(toprint):
621 if repo.ui.verbose or not m.exact(abs):
628 if repo.ui.verbose or not m.exact(abs):
622 rel = m.rel(abs)
629 rel = m.rel(abs)
623 if abs in unknownset:
630 if abs in unknownset:
624 status = _('adding %s\n') % ((pats and rel) or abs)
631 status = _('adding %s\n') % ((pats and rel) or abs)
625 else:
632 else:
626 status = _('removing %s\n') % ((pats and rel) or abs)
633 status = _('removing %s\n') % ((pats and rel) or abs)
627 repo.ui.status(status)
634 repo.ui.status(status)
628
635
629 renames = _findrenames(repo, m, added + unknown, removed + deleted,
636 renames = _findrenames(repo, m, added + unknown, removed + deleted,
630 similarity)
637 similarity)
631
638
632 if not dry_run:
639 if not dry_run:
633 _markchanges(repo, unknown, deleted, renames)
640 _markchanges(repo, unknown, deleted, renames)
634
641
635 for f in rejected:
642 for f in rejected:
636 if f in m.files():
643 if f in m.files():
637 return 1
644 return 1
638 return 0
645 return 0
639
646
640 def marktouched(repo, files, similarity=0.0):
647 def marktouched(repo, files, similarity=0.0):
641 '''Assert that files have somehow been operated upon. files are relative to
648 '''Assert that files have somehow been operated upon. files are relative to
642 the repo root.'''
649 the repo root.'''
643 m = matchfiles(repo, files)
650 m = matchfiles(repo, files)
644 rejected = []
651 rejected = []
645 m.bad = lambda x, y: rejected.append(x)
652 m.bad = lambda x, y: rejected.append(x)
646
653
647 added, unknown, deleted, removed = _interestingfiles(repo, m)
654 added, unknown, deleted, removed = _interestingfiles(repo, m)
648
655
649 if repo.ui.verbose:
656 if repo.ui.verbose:
650 unknownset = set(unknown)
657 unknownset = set(unknown)
651 toprint = unknownset.copy()
658 toprint = unknownset.copy()
652 toprint.update(deleted)
659 toprint.update(deleted)
653 for abs in sorted(toprint):
660 for abs in sorted(toprint):
654 if abs in unknownset:
661 if abs in unknownset:
655 status = _('adding %s\n') % abs
662 status = _('adding %s\n') % abs
656 else:
663 else:
657 status = _('removing %s\n') % abs
664 status = _('removing %s\n') % abs
658 repo.ui.status(status)
665 repo.ui.status(status)
659
666
660 renames = _findrenames(repo, m, added + unknown, removed + deleted,
667 renames = _findrenames(repo, m, added + unknown, removed + deleted,
661 similarity)
668 similarity)
662
669
663 _markchanges(repo, unknown, deleted, renames)
670 _markchanges(repo, unknown, deleted, renames)
664
671
665 for f in rejected:
672 for f in rejected:
666 if f in m.files():
673 if f in m.files():
667 return 1
674 return 1
668 return 0
675 return 0
669
676
670 def _interestingfiles(repo, matcher):
677 def _interestingfiles(repo, matcher):
671 '''Walk dirstate with matcher, looking for files that addremove would care
678 '''Walk dirstate with matcher, looking for files that addremove would care
672 about.
679 about.
673
680
674 This is different from dirstate.status because it doesn't care about
681 This is different from dirstate.status because it doesn't care about
675 whether files are modified or clean.'''
682 whether files are modified or clean.'''
676 added, unknown, deleted, removed = [], [], [], []
683 added, unknown, deleted, removed = [], [], [], []
677 audit_path = pathutil.pathauditor(repo.root)
684 audit_path = pathutil.pathauditor(repo.root)
678
685
679 ctx = repo[None]
686 ctx = repo[None]
680 dirstate = repo.dirstate
687 dirstate = repo.dirstate
681 walkresults = dirstate.walk(matcher, sorted(ctx.substate), True, False,
688 walkresults = dirstate.walk(matcher, sorted(ctx.substate), True, False,
682 full=False)
689 full=False)
683 for abs, st in walkresults.iteritems():
690 for abs, st in walkresults.iteritems():
684 dstate = dirstate[abs]
691 dstate = dirstate[abs]
685 if dstate == '?' and audit_path.check(abs):
692 if dstate == '?' and audit_path.check(abs):
686 unknown.append(abs)
693 unknown.append(abs)
687 elif dstate != 'r' and not st:
694 elif dstate != 'r' and not st:
688 deleted.append(abs)
695 deleted.append(abs)
689 # for finding renames
696 # for finding renames
690 elif dstate == 'r':
697 elif dstate == 'r':
691 removed.append(abs)
698 removed.append(abs)
692 elif dstate == 'a':
699 elif dstate == 'a':
693 added.append(abs)
700 added.append(abs)
694
701
695 return added, unknown, deleted, removed
702 return added, unknown, deleted, removed
696
703
697 def _findrenames(repo, matcher, added, removed, similarity):
704 def _findrenames(repo, matcher, added, removed, similarity):
698 '''Find renames from removed files to added ones.'''
705 '''Find renames from removed files to added ones.'''
699 renames = {}
706 renames = {}
700 if similarity > 0:
707 if similarity > 0:
701 for old, new, score in similar.findrenames(repo, added, removed,
708 for old, new, score in similar.findrenames(repo, added, removed,
702 similarity):
709 similarity):
703 if (repo.ui.verbose or not matcher.exact(old)
710 if (repo.ui.verbose or not matcher.exact(old)
704 or not matcher.exact(new)):
711 or not matcher.exact(new)):
705 repo.ui.status(_('recording removal of %s as rename to %s '
712 repo.ui.status(_('recording removal of %s as rename to %s '
706 '(%d%% similar)\n') %
713 '(%d%% similar)\n') %
707 (matcher.rel(old), matcher.rel(new),
714 (matcher.rel(old), matcher.rel(new),
708 score * 100))
715 score * 100))
709 renames[new] = old
716 renames[new] = old
710 return renames
717 return renames
711
718
712 def _markchanges(repo, unknown, deleted, renames):
719 def _markchanges(repo, unknown, deleted, renames):
713 '''Marks the files in unknown as added, the files in deleted as removed,
720 '''Marks the files in unknown as added, the files in deleted as removed,
714 and the files in renames as copied.'''
721 and the files in renames as copied.'''
715 wctx = repo[None]
722 wctx = repo[None]
716 wlock = repo.wlock()
723 wlock = repo.wlock()
717 try:
724 try:
718 wctx.forget(deleted)
725 wctx.forget(deleted)
719 wctx.add(unknown)
726 wctx.add(unknown)
720 for new, old in renames.iteritems():
727 for new, old in renames.iteritems():
721 wctx.copy(old, new)
728 wctx.copy(old, new)
722 finally:
729 finally:
723 wlock.release()
730 wlock.release()
724
731
def dirstatecopy(ui, repo, wctx, src, dst, dryrun=False, cwd=None):
    """Update the dirstate to reflect the intent of copying src to dst. For
    different reasons it might not end with dst being marked as copied from src.
    """
    origsrc = repo.dirstate.copied(src) or src
    if dst == origsrc: # copying back a copy?
        if repo.dirstate[dst] not in 'mn' and not dryrun:
            repo.dirstate.normallookup(dst)
        return
    if repo.dirstate[origsrc] == 'a' and origsrc == src:
        # the source was only just added - there is nothing committed
        # to record copy data against, so warn and plain-add instead
        if not ui.quiet:
            ui.warn(_("%s has not been committed yet, so no copy "
                      "data will be stored for %s.\n")
                    % (repo.pathto(origsrc, cwd), repo.pathto(dst, cwd)))
        if repo.dirstate[dst] in '?r' and not dryrun:
            wctx.add([dst])
    elif not dryrun:
        wctx.copy(origsrc, dst)
743
750
def readrequires(opener, supported):
    '''Reads and parses .hg/requires and checks if all entries found
    are in the list of supported features.'''
    requirements = set(opener.read("requires").splitlines())
    missings = []
    for requirement in requirements:
        if requirement in supported:
            continue
        # a requirement that is empty or does not start with an
        # alphanumeric character indicates a corrupt requires file
        if not requirement or not requirement[0].isalnum():
            raise error.RequirementError(_(".hg/requires file is corrupt"))
        missings.append(requirement)
    if missings:
        raise error.RequirementError(
            _("repository requires features unknown to this Mercurial: %s")
            % " ".join(sorted(missings)),
            hint=_("see http://mercurial.selenic.com/wiki/MissingRequirement"
                   " for more information"))
    return requirements
762
769
763 class filecachesubentry(object):
770 class filecachesubentry(object):
764 def __init__(self, path, stat):
771 def __init__(self, path, stat):
765 self.path = path
772 self.path = path
766 self.cachestat = None
773 self.cachestat = None
767 self._cacheable = None
774 self._cacheable = None
768
775
769 if stat:
776 if stat:
770 self.cachestat = filecachesubentry.stat(self.path)
777 self.cachestat = filecachesubentry.stat(self.path)
771
778
772 if self.cachestat:
779 if self.cachestat:
773 self._cacheable = self.cachestat.cacheable()
780 self._cacheable = self.cachestat.cacheable()
774 else:
781 else:
775 # None means we don't know yet
782 # None means we don't know yet
776 self._cacheable = None
783 self._cacheable = None
777
784
778 def refresh(self):
785 def refresh(self):
779 if self.cacheable():
786 if self.cacheable():
780 self.cachestat = filecachesubentry.stat(self.path)
787 self.cachestat = filecachesubentry.stat(self.path)
781
788
782 def cacheable(self):
789 def cacheable(self):
783 if self._cacheable is not None:
790 if self._cacheable is not None:
784 return self._cacheable
791 return self._cacheable
785
792
786 # we don't know yet, assume it is for now
793 # we don't know yet, assume it is for now
787 return True
794 return True
788
795
789 def changed(self):
796 def changed(self):
790 # no point in going further if we can't cache it
797 # no point in going further if we can't cache it
791 if not self.cacheable():
798 if not self.cacheable():
792 return True
799 return True
793
800
794 newstat = filecachesubentry.stat(self.path)
801 newstat = filecachesubentry.stat(self.path)
795
802
796 # we may not know if it's cacheable yet, check again now
803 # we may not know if it's cacheable yet, check again now
797 if newstat and self._cacheable is None:
804 if newstat and self._cacheable is None:
798 self._cacheable = newstat.cacheable()
805 self._cacheable = newstat.cacheable()
799
806
800 # check again
807 # check again
801 if not self._cacheable:
808 if not self._cacheable:
802 return True
809 return True
803
810
804 if self.cachestat != newstat:
811 if self.cachestat != newstat:
805 self.cachestat = newstat
812 self.cachestat = newstat
806 return True
813 return True
807 else:
814 else:
808 return False
815 return False
809
816
810 @staticmethod
817 @staticmethod
811 def stat(path):
818 def stat(path):
812 try:
819 try:
813 return util.cachestat(path)
820 return util.cachestat(path)
814 except OSError, e:
821 except OSError, e:
815 if e.errno != errno.ENOENT:
822 if e.errno != errno.ENOENT:
816 raise
823 raise
817
824
class filecacheentry(object):
    '''Aggregates filecachesubentry trackers for a set of file paths.'''

    def __init__(self, paths, stat=True):
        self._entries = [filecachesubentry(path, stat) for path in paths]

    def changed(self):
        '''true if any entry has changed'''
        for subentry in self._entries:
            if subentry.changed():
                return True
        return False

    def refresh(self):
        # re-stat every tracked path
        for subentry in self._entries:
            subentry.refresh()
834
841
class filecache(object):
    '''A property like decorator that tracks files under .hg/ for updates.

    Records stat info when called in _filecache.

    On subsequent calls, compares old stat info with new info, and recreates the
    object when any of the files changes, updating the new stat info in
    _filecache.

    Mercurial either atomic renames or appends for files under .hg,
    so to ensure the cache is reliable we need the filesystem to be able
    to tell us if a file has been replaced. If it can't, we fallback to
    recreating the object on every call (essentially the same behaviour as
    propertycache).

    '''
    def __init__(self, *paths):
        # relative paths of the files this cached value depends on
        self.paths = paths

    def join(self, obj, fname):
        """Used to compute the runtime path of a cached file.

        Users should subclass filecache and provide their own version of this
        function to call the appropriate join function on 'obj' (an instance
        of the class that its member function was decorated).
        """
        return obj.join(fname)

    def __call__(self, func):
        # decorator protocol: capture the wrapped function and its name,
        # then install this descriptor under that name on the class
        self.func = func
        self.name = func.__name__
        return self

    def __get__(self, obj, type=None):
        # do we need to check if the file changed?
        # fast path: a value cached directly in the instance __dict__ is
        # returned without re-statting the files; invalidation happens by
        # deleting that attribute (see __delete__)
        if self.name in obj.__dict__:
            assert self.name in obj._filecache, self.name
            return obj.__dict__[self.name]

        entry = obj._filecache.get(self.name)

        if entry:
            # stat info exists from an earlier call - rebuild the value
            # only if any of the tracked files changed on disk
            if entry.changed():
                entry.obj = self.func(obj)
        else:
            paths = [self.join(obj, path) for path in self.paths]

            # We stat -before- creating the object so our cache doesn't lie if
            # a writer modified between the time we read and stat
            entry = filecacheentry(paths, True)
            entry.obj = self.func(obj)

            obj._filecache[self.name] = entry

        obj.__dict__[self.name] = entry.obj
        return entry.obj

    def __set__(self, obj, value):
        if self.name not in obj._filecache:
            # we add an entry for the missing value because X in __dict__
            # implies X in _filecache
            # stat=False: an assigned value carries no known on-disk state
            paths = [self.join(obj, path) for path in self.paths]
            ce = filecacheentry(paths, False)
            obj._filecache[self.name] = ce
        else:
            ce = obj._filecache[self.name]

        ce.obj = value # update cached copy
        obj.__dict__[self.name] = value # update copy returned by obj.x

    def __delete__(self, obj):
        # drop only the instance-level cache; the _filecache entry stays so
        # the next __get__ can compare stat info and rebuild if needed
        try:
            del obj.__dict__[self.name]
        except KeyError:
            raise AttributeError(self.name)
910
917
class dirs(object):
    '''a multiset of directory names from a dirstate or manifest'''

    def __init__(self, map, skip=None):
        self._dirs = {}
        addpath = self.addpath
        if skip is not None and util.safehasattr(map, 'iteritems'):
            # dirstate-style map: values are state tuples; entries whose
            # state equals 'skip' are left out of the multiset
            for f, s in map.iteritems():
                if s[0] != skip:
                    addpath(f)
        else:
            for f in map:
                addpath(f)

    def addpath(self, path):
        counts = self._dirs
        for base in finddirs(path):
            if base in counts:
                # all shallower ancestors were counted when this base
                # was first added, so stop here
                counts[base] += 1
                return
            counts[base] = 1

    def delpath(self, path):
        counts = self._dirs
        for base in finddirs(path):
            if counts[base] > 1:
                # shallower ancestors keep their counts as long as this
                # base is still referenced
                counts[base] -= 1
                return
            del counts[base]

    def __iter__(self):
        return self._dirs.iterkeys()

    def __contains__(self, d):
        return d in self._dirs
946
953
# prefer the C implementation of the dirs multiset from the parsers
# module when it is available; it is a drop-in replacement
if util.safehasattr(parsers, 'dirs'):
    dirs = parsers.dirs
949
956
def finddirs(path):
    '''Generate every ancestor directory of a '/'-separated path,
    from deepest to shallowest, excluding the path itself.'''
    prefix = path
    while True:
        cut = prefix.rfind('/')
        if cut == -1:
            return
        prefix = prefix[:cut]
        yield prefix
General Comments 0
You need to be logged in to leave comments. Login now