upstream/mercurial-mirror Files · mercurial/fileset.py

localrepo: add branchtip() method for faster single-branch lookups...

localrepo: add branchtip() method for faster single-branch lookups For the PyPy repo with 744 branches and 843 branch heads, this brings hg log -r default over NFS from: CallCount Recursive Total(ms) Inline(ms) module:lineno(function) 3249 0 1.3222 1.3222 <open> 3244 0 0.6211 0.6211 <method 'close' of 'file' objects> 3243 0 0.0800 0.0800 <method 'read' of 'file' objects> 3241 0 0.0660 0.0660 <method 'seek' of 'file' objects> 3905 0 0.0476 0.0476 <zlib.decompress> 3281 0 2.6756 0.0472 mercurial.changelog:182(read) +3281 0 2.5256 0.0453 +mercurial.revlog:881(revision) +3276 0 0.0389 0.0196 +mercurial.changelog:28(decodeextra) +6562 0 0.0123 0.0123 +<method 'split' of 'str' objects> +6562 0 0.0408 0.0073 +mercurial.encoding:61(tolocal) +3281 0 0.0054 0.0054 +<method 'index' of 'str' objects> 3241 0 2.2464 0.0456 mercurial.revlog:818(_loadchunk) +3241 0 0.6205 0.6205 +<method 'close' of 'file' objects> +3241 0 0.0765 0.0765 +<method 'read' of 'file' objects> +3241 0 0.0660 0.0660 +<method 'seek' of 'file' objects> +3241 0 1.4209 0.0135 +mercurial.store:374(__call__) +3241 0 0.0122 0.0107 +mercurial.revlog:810(_addchunk) 3281 0 2.5256 0.0453 mercurial.revlog:881(revision) +3280 0 0.0175 0.0175 +mercurial.revlog:305(rev) +3281 0 2.2819 0.0119 +mercurial.revlog:847(_chunkraw) +3281 0 0.0603 0.0083 +mercurial.revlog:945(_checkhash) +3281 0 0.0051 0.0051 +mercurial.revlog:349(flags) +3281 0 0.0040 0.0040 +<mercurial.mpatch.patches> 13682 0 0.0479 0.0248 <method 'decode' of 'str' objects> +7418 0 0.0228 0.0076 +encodings.utf_8:15(decode) +1 0 0.0003 0.0000 +encodings:71(search_function) 3248 0 1.3995 0.0246 mercurial.scmutil:218(__call__) +3248 0 1.3222 1.3222 +<open> +3248 0 0.0235 0.0184 +os.path:80(split) +3248 0 0.0084 0.0068 +mercurial.scmutil:92(__call__) Time: real 2.750 secs (user 0.680+0.000 sys 0.360+0.000) down to: CallCount Recursive Total(ms) Inline(ms) module:lineno(function) 55 31 0.0197 0.0163 <__import__> +1 0 0.0006 0.0002 +mercurial.context:8(<module>) +1 
0 0.0042 0.0001 +mercurial.revlog:12(<module>) +1 0 0.0002 0.0001 +mercurial.match:8(<module>) +1 0 0.0003 0.0001 +mercurial.dirstate:7(<module>) +1 0 0.0057 0.0001 +mercurial.changelog:8(<module>) 1 0 0.0117 0.0032 mercurial.localrepo:525(_readbranchcache) +844 0 0.0015 0.0015 +<binascii.unhexlify> +845 0 0.0010 0.0010 +<method 'split' of 'str' objects> +843 0 0.0045 0.0009 +mercurial.encoding:61(tolocal) +843 0 0.0004 0.0004 +<method 'setdefault' of 'dict' objects> +1 0 0.0003 0.0003 +<method 'close' of 'file' objects> 3 0 0.0029 0.0029 <method 'read' of 'file' objects> 9 0 0.0018 0.0018 <open> 990 0 0.0017 0.0017 <binascii.unhexlify> 53 0 0.0016 0.0016 mercurial.demandimport:43(__init__) 862 0 0.0015 0.0015 <_codecs.utf_8_decode> 862 0 0.0037 0.0014 <method 'decode' of 'str' objects> +862 0 0.0023 0.0008 +encodings.utf_8:15(decode) 981 0 0.0011 0.0011 <method 'split' of 'str' objects> 861 0 0.0046 0.0009 mercurial.encoding:61(tolocal) +861 0 0.0037 0.0014 +<method 'decode' of 'str' objects> 862 0 0.0023 0.0008 encodings.utf_8:15(decode) +862 0 0.0015 0.0015 +<_codecs.utf_8_decode> 4 0 0.0008 0.0008 <method 'close' of 'file' objects> 179 154 0.0202 0.0004 mercurial.demandimport:83(__getattribute__) +36 11 0.0199 0.0003 +mercurial.demandimport:55(_load) +72 0 0.0001 0.0001 +mercurial.demandimport:83(__getattribute__) +36 0 0.0000 0.0000 +<getattr> 1 0 0.0015 0.0004 mercurial.tags:148(_readtagcache) Time: real 0.060 secs (user 0.030+0.000 sys 0.010+0.000)

Angel Ezquerra - - Load All Authors

File last commit:

r16443:9e02e032 default


                r16719:e7bf09ac

default

Download file

             fileset.py
        
                    465 lines
            
             | 13.4 KiB
            
                | text/x-python
            
             |
                PythonLexer
            
             / mercurial / fileset.py
          
                    History
                
                 |
                  Annotation
                 | Raw
                 |Copy content
                 |Copy permalink

      # fileset.py - file set queries for mercurial

      #

      # Copyright 2010 Matt Mackall <mpm@selenic.com>

      #

      # This software may be used and distributed according to the terms of the

      # GNU General Public License version 2 or any later version.

      import parser, error, util, merge, re

      from i18n import _

      # Token table handed to parser.parser() below. Keys are the token types
      # yielded by tokenize(). The tuple layout is interpreted by the parser
      # module, which is not shown here -- presumably (binding strength,
      # prefix rule, infix rule); TODO confirm against parser.py.
      elements = {

          "(": (20, ("group", 1, ")"), ("func", 1, ")")),

          "-": (5, ("negate", 19), ("minus", 5)),

          "not": (10, ("not", 10)),

          "!": (10, ("not", 10)),

          "and": (5, None, ("and", 5)),

          "&": (5, None, ("and", 5)),

          "or": (4, None, ("or", 4)),

          "|": (4, None, ("or", 4)),

          "+": (4, None, ("or", 4)),

          ",": (2, None, ("list", 2)),

          ")": (0, None, None),

          "symbol": (0, ("symbol",), None),

          "string": (0, ("string",), None),

          "end": (0, None, None),

      }

      # Words that tokenize() emits as operator tokens instead of 'symbol'.
      keywords = set(['and', 'or', 'not'])

      # Non-alphanumeric characters that tokenize() accepts inside a symbol.
      globchars = ".*{}[]?/\\"

      def tokenize(program):
          """Yield ``(type, value, position)`` tokens for a fileset expression.

          Operators and keywords carry ``None`` as value, quoted text is
          yielded as ``'string'`` and any other word as ``'symbol'``. The
          stream always ends with ``('end', None, pos)``. Raises
          error.ParseError on an unterminated string or an unexpected
          character.
          """
          def insymbol(ch):
              # alphanumerics, glob characters and anything above 7-bit ASCII
              return ch.isalnum() or ch in globchars or ord(ch) > 127

          end = len(program)
          pos = 0
          while pos < end:
              c = program[pos]

              if c.isspace():
                  # whitespace only separates tokens
                  pos += 1
                  continue

              if c in "(),-|&+!":
                  # one-character operators are their own token type
                  yield (c, None, pos)
                  pos += 1
                  continue

              israw = c == 'r' and program[pos:pos + 2] in ("r'", 'r"')
              if israw or c in '"\'':
                  if israw:
                      # step over the r prefix; raw text is kept verbatim
                      pos += 1
                      quote = program[pos]
                      decode = lambda x: x
                  else:
                      quote = c
                      decode = lambda x: x.decode('string-escape')
                  pos += 1
                  start = pos
                  while pos < end:
                      d = program[pos]
                      if d == '\\':
                          # a backslash protects the character after it
                          pos += 2
                      elif d == quote:
                          yield ('string', decode(program[start:pos]), start)
                          break
                      else:
                          pos += 1
                  else:
                      # ran off the end without seeing the closing quote
                      raise error.ParseError(_("unterminated string"), start)
                  pos += 1
                  continue

              if insymbol(c):
                  start = pos
                  pos += 1
                  while pos < end and insymbol(program[pos]):
                      pos += 1
                  sym = program[start:pos]
                  if sym in keywords:
                      # and/or/not act as operators
                      yield (sym, None, start)
                  else:
                      yield ('symbol', sym, start)
                  continue

              raise error.ParseError(_("syntax error"), pos)

          yield ('end', None, pos)

      # parse method of a parser built from tokenize() and the elements table;
      # getfileset() unpacks its result as (tree, pos).
      parse = parser.parser(tokenize, elements).parse

      def getstring(x, err):
          """Return the text carried by a 'string' or 'symbol' node.

          x is a parse-tree node or a false value; err is the message of the
          error.ParseError raised when x is missing or of another kind.
          """
          if not x or x[0] not in ('string', 'symbol'):
              raise error.ParseError(err)
          return x[1]

      def getset(mctx, x):
          """Evaluate parse-tree node x in mctx through the methods table.

          The first element of x selects the handler, the remaining elements
          are passed on as positional arguments. Raises error.ParseError when
          x is empty.
          """
          if x:
              handler = methods[x[0]]
              return handler(mctx, *x[1:])
          raise error.ParseError(_("missing argument"))

      def stringset(mctx, x):
          """Return the files of mctx.subset accepted by a matcher for x."""
          accept = mctx.matcher([x])
          matched = []
          for f in mctx.subset:
              if accept(f):
                  matched.append(f)
          return matched

      def andset(mctx, x, y):
          """Evaluate y against only the files that x selected."""
          left = getset(mctx, x)
          narrowed = mctx.narrow(left)
          return getset(narrowed, y)

      def orset(mctx, x, y):
          """Return the files selected by x followed by those only y selects.

          Both operands are evaluated against the same mctx; the order of each
          operand's result is preserved.
          """
          xl = getset(mctx, x)
          yl = getset(mctx, y)
          # test membership against a set instead of rescanning the list xl
          # for every element of yl
          seen = set(xl)
          return xl + [f for f in yl if f not in seen]

      def notset(mctx, x):
          """Return the files of mctx.subset that x does not select."""
          excluded = set(getset(mctx, x))
          kept = []
          for f in mctx.subset:
              if f not in excluded:
                  kept.append(f)
          return kept

      def listset(mctx, a, b):
          """Handler for 'list' nodes reached through getset(); always raises.

          The arguments are ignored: evaluating a list as a file set is
          reported as an error.ParseError.
          """
          msg = _("can't use a list in this context")
          raise error.ParseError(msg)

      def modified(mctx, x):
          """``modified()``
          File that is modified according to status.
          """
          # x is the argument subtree and must be empty, else ParseError
          # i18n: "modified" is a keyword
          getargs(x, 0, 0, _("modified takes no arguments"))
          # build a set once so each subset file is checked in constant time
          s = set(mctx.status()[0])
          return [f for f in mctx.subset if f in s]

      def added(mctx, x):
          """``added()``
          File that is added according to status.
          """
          # x is the argument subtree and must be empty, else ParseError
          # i18n: "added" is a keyword
          getargs(x, 0, 0, _("added takes no arguments"))
          # build a set once so each subset file is checked in constant time
          s = set(mctx.status()[1])
          return [f for f in mctx.subset if f in s]

      def removed(mctx, x):
          """``removed()``
          File that is removed according to status.
          """
          # x is the argument subtree and must be empty, else ParseError
          # i18n: "removed" is a keyword
          getargs(x, 0, 0, _("removed takes no arguments"))
          # build a set once so each subset file is checked in constant time
          s = set(mctx.status()[2])
          return [f for f in mctx.subset if f in s]

      def deleted(mctx, x):
          """``deleted()``
          File that is deleted according to status.
          """
          # x is the argument subtree and must be empty, else ParseError
          # i18n: "deleted" is a keyword
          getargs(x, 0, 0, _("deleted takes no arguments"))
          # build a set once so each subset file is checked in constant time
          s = set(mctx.status()[3])
          return [f for f in mctx.subset if f in s]

      def unknown(mctx, x):
          """``unknown()``
          File that is unknown according to status. These files will only be
          considered if this predicate is used.
          """
          # x is the argument subtree and must be empty, else ParseError
          # i18n: "unknown" is a keyword
          getargs(x, 0, 0, _("unknown takes no arguments"))
          # build a set once so each subset file is checked in constant time
          s = set(mctx.status()[4])
          return [f for f in mctx.subset if f in s]

      def ignored(mctx, x):
          """``ignored()``
          File that is ignored according to status. These files will only be
          considered if this predicate is used.
          """
          # x is the argument subtree and must be empty, else ParseError
          # i18n: "ignored" is a keyword
          getargs(x, 0, 0, _("ignored takes no arguments"))
          # build a set once so each subset file is checked in constant time
          s = set(mctx.status()[5])
          return [f for f in mctx.subset if f in s]

      def clean(mctx, x):
          """``clean()``
          File that is clean according to status.
          """
          # x is the argument subtree and must be empty, else ParseError
          # i18n: "clean" is a keyword
          getargs(x, 0, 0, _("clean takes no arguments"))
          # build a set once so each subset file is checked in constant time
          s = set(mctx.status()[6])
          return [f for f in mctx.subset if f in s]

      def func(mctx, a, b):
          """Evaluate a 'func' node: call predicate a with argument subtree b.

          a must be a 'symbol' node naming an entry of the symbols table;
          anything else raises error.ParseError.
          """
          if a[0] == 'symbol' and a[1] in symbols:
              return symbols[a[1]](mctx, b)
          # a[1] is itself a tuple when the callee is not a plain symbol (for
          # example a group); wrap it so %-formatting receives exactly one
          # argument instead of failing with TypeError
          raise error.ParseError(_("not a function: %s") % (a[1],))

      def getlist(x):
          """Flatten a left-nested 'list' node into a Python list of nodes.

          A false value gives [], a non-list node gives a one-element list.
          """
          items = []
          node = x
          # walk down the left spine, collecting right-hand members last-first
          while node and node[0] == 'list':
              items.append(node[2])
              node = node[1]
          if node:
              items.append(node)
          items.reverse()
          return items

      def getargs(x, min, max, err):
          """Return the argument nodes of x, checking their number.

          Raises error.ParseError(err) unless min <= count <= max.
          """
          args = getlist(x)
          count = len(args)
          if min <= count <= max:
              return args
          raise error.ParseError(err)

      def binary(mctx, x):
          """``binary()``
          File that appears to be binary (contains NUL bytes).
          """
          # i18n: "binary" is a keyword
          getargs(x, 0, 0, _("binary takes no arguments"))
          found = []
          # only files present in the context have data to inspect
          for f in mctx.existing():
              if util.binary(mctx.ctx[f].data()):
                  found.append(f)
          return found

      def exec_(mctx, x):
          """``exec()``
          File that is marked as executable.
          """
          # i18n: "exec" is a keyword
          getargs(x, 0, 0, _("exec takes no arguments"))
          executables = []
          for f in mctx.existing():
              # the flags string is exactly 'x' for an executable
              if mctx.ctx.flags(f) == 'x':
                  executables.append(f)
          return executables

      def symlink(mctx, x):
          """``symlink()``
          File that is marked as a symlink.
          """
          # i18n: "symlink" is a keyword
          getargs(x, 0, 0, _("symlink takes no arguments"))
          links = []
          for f in mctx.existing():
              # the flags string is exactly 'l' for a symlink
              if mctx.ctx.flags(f) == 'l':
                  links.append(f)
          return links

      def resolved(mctx, x):
          """``resolved()``
          File that is marked resolved according to the resolve state.
          """
          # i18n: "resolved" is a keyword
          getargs(x, 0, 0, _("resolved takes no arguments"))
          # the merge state is only consulted when the context has no revision
          # number (presumably the working directory -- confirm)
          if mctx.ctx.rev() is None:
              ms = merge.mergestate(mctx.ctx._repo)
              return [f for f in mctx.subset if f in ms and ms[f] == 'r']
          return []

      def unresolved(mctx, x):
          """``unresolved()``
          File that is marked unresolved according to the resolve state.
          """
          # i18n: "unresolved" is a keyword
          getargs(x, 0, 0, _("unresolved takes no arguments"))
          # the merge state is only consulted when the context has no revision
          # number (presumably the working directory -- confirm)
          if mctx.ctx.rev() is None:
              ms = merge.mergestate(mctx.ctx._repo)
              return [f for f in mctx.subset if f in ms and ms[f] == 'u']
          return []

      def hgignore(mctx, x):
          """``hgignore()``
          File that matches the active .hgignore pattern.
          """
          # i18n: "hgignore" is a keyword
          getargs(x, 0, 0, _("hgignore takes no arguments"))
          # the dirstate's ignore callable is applied to every subset file
          isignored = mctx.ctx._repo.dirstate._ignore
          hits = []
          for f in mctx.subset:
              if isignored(f):
                  hits.append(f)
          return hits

      def grep(mctx, x):
          """``grep(regex)``
          File contains the given regular expression.
          """
          # i18n: "grep" is a keyword
          pat = getstring(x, _("grep requires a pattern"))
          try:
              r = re.compile(pat)
          except re.error:
              # a malformed pattern is a mistake in the expression; report it
              # like every other fileset syntax problem instead of letting
              # the raw re.error escape
              raise error.ParseError(_("invalid match pattern: %s") % pat)
          # only files present in the context have data to search
          return [f for f in mctx.existing() if r.search(mctx.ctx[f].data())]

      # Size suffixes understood by _sizetoint() and _sizetomax(), each mapped
      # to its multiplier (powers of 1024).
      _units = dict(k=2**10, K=2**10, kB=2**10, KB=2**10,

                    M=2**20, MB=2**20, G=2**30, GB=2**30)

      def _sizetoint(s):
          """Convert a size such as '20', '4k' or '.5MB' to an integer.

          A suffix from _units scales the (possibly fractional) number;
          without one the text must be a plain integer. Raises
          error.ParseError when the number cannot be parsed.
          """
          try:
              s = s.strip()
              for suffix, factor in _units.items():
                  if not s.endswith(suffix):
                      continue
                  number = s[:-len(suffix)]
                  return int(float(number) * factor)
              return int(s)
          except ValueError:
              raise error.ParseError(_("couldn't parse size: %s") % s)

      def _sizetomax(s):
          """Return the largest size that still reads as s.

          With a unit suffix the last written digit is bumped by one and one
          is subtracted: max(4k) = 5k - 1, max(4.5k) = 4.6k - 1. Without a
          suffix the value is exact. Raises error.ParseError when the number
          cannot be parsed.
          """
          try:
              s = s.strip()
              for suffix, factor in _units.items():
                  if not s.endswith(suffix):
                      continue
                  n = s[:-len(suffix)]
                  if "." in n:
                      # one step in the last decimal place that was written
                      inc = 1.0 / 10 ** len(n.split(".")[1])
                  else:
                      inc = 1.0
                  return int((float(n) + inc) * factor) - 1
              # no extension, this is a precise value
              return int(s)
          except ValueError:
              raise error.ParseError(_("couldn't parse size: %s") % s)

      def size(mctx, x):
          """``size(expression)``
          File size matches the given expression. Examples:

          - 1k (files from 1024 to 2047 bytes)
          - < 20k (files less than 20480 bytes)
          - >= .5MB (files at least 524288 bytes)
          - 4k - 1MB (files from 4096 bytes to 1048576 bytes)
          """

          # i18n: "size" is a keyword
          expr = getstring(x, _("size requires an expression")).strip()
          if '-' in expr: # do we have a range?
              a, b = expr.split('-', 1)
              a = _sizetoint(a)
              b = _sizetoint(b)
              m = lambda x: x >= a and x <= b
          elif expr.startswith("<="):
              a = _sizetoint(expr[2:])
              m = lambda x: x <= a
          elif expr.startswith("<"):
              a = _sizetoint(expr[1:])
              m = lambda x: x < a
          elif expr.startswith(">="):
              a = _sizetoint(expr[2:])
              m = lambda x: x >= a
          elif expr.startswith(">"):
              a = _sizetoint(expr[1:])
              m = lambda x: x > a
          # isdigit must be *called* (the bare method is always true), and
          # slicing keeps an empty expression from raising IndexError
          elif expr[:1].isdigit() or expr.startswith('.'):
              # bare value: match every size that reads as what was written
              a = _sizetoint(expr)
              b = _sizetomax(expr)
              m = lambda x: x >= a and x <= b
          else:
              raise error.ParseError(_("couldn't parse size: %s") % expr)

          # only files present in the context have a size
          return [f for f in mctx.existing() if m(mctx.ctx[f].size())]

      def encoding(mctx, x):
          """``encoding(name)``
          File can be successfully decoded with the given character
          encoding. May not be useful for encodings other than ASCII and
          UTF-8.
          """

          # i18n: "encoding" is a keyword
          enc = getstring(x, _("encoding requires an encoding name"))

          decodable = []
          for f in mctx.existing():
              data = mctx.ctx[f].data()
              try:
                  data.decode(enc)
              except LookupError:
                  # the codec itself does not exist: abort the whole query
                  raise util.Abort(_("unknown encoding '%s'") % enc)
              except UnicodeDecodeError:
                  # this file is simply not valid in enc; leave it out
                  pass
              else:
                  decodable.append(f)

          return decodable

      def copied(mctx, x):
          """``copied()``
          File that is recorded as being copied.
          """
          # i18n: "copied" is a keyword
          getargs(x, 0, 0, _("copied takes no arguments"))

          def iscopy(f):
              # a first parent stored under another path marks a copy
              p = mctx.ctx[f].parents()
              return p and p[0].path() != f

          return [f for f in mctx.subset if iscopy(f)]

      def subrepo(mctx, x):
          """``subrepo([pattern])``
          Subrepositories whose paths match the given pattern.
          """
          # i18n: "subrepo" is a keyword
          getargs(x, 0, 1, _("subrepo takes at most one argument"))
          ctx = mctx.ctx
          sstate = ctx.substate
          if not x:
              # no pattern: every subrepository is selected
              return list(sstate)

          pat = getstring(x, _("subrepo requires a pattern or no arguments"))

          import match as matchmod # avoid circular import issues
          if matchmod.patkind(pat):
              m = matchmod.match(ctx._repo.root, '', [pat], ctx=ctx)
          else:
              # a pattern without a kind prefix is compared literally
              m = lambda s: s == pat
          return [sub for sub in sstate if m(sub)]

      # Predicate name -> implementation. func() looks callees up here, and
      # the values are exported below as i18nfunctions.
      symbols = {

          'added': added,

          'binary': binary,

          'clean': clean,

          'copied': copied,

          'deleted': deleted,

          'encoding': encoding,

          'exec': exec_,

          'grep': grep,

          'ignored': ignored,

          'hgignore': hgignore,

          'modified': modified,

          'removed': removed,

          'resolved': resolved,

          'size': size,

          'symlink': symlink,

          'unknown': unknown,

          'unresolved': unresolved,

          'subrepo': subrepo,

      }

      def minusset(mctx, x, y):
          """Return the files selected by x that y does not select."""
          xl = getset(mctx, x)
          yl = set(getset(mctx, y))
          return [f for f in xl if f not in yl]

      def negateset(mctx, x):
          """Handler for a prefix '-'; a file set cannot be negated this way."""
          raise error.ParseError(_("can't use negate operator in this context"))

      # Parse-tree node type -> evaluator, looked up by getset(). The "-" entry
      # of the elements table yields 'minus' and 'negate' nodes, so both need a
      # handler here; without one getset() fails with a KeyError.
      methods = {
          'string': stringset,
          'symbol': stringset,
          'and': andset,
          'or': orset,
          'minus': minusset,
          'negate': negateset,
          'list': listset,
          'group': getset,
          'not': notset,
          'func': func,
      }

      class matchctx(object):
          """Evaluation context for a fileset expression.

          Bundles the context object being queried (ctx), the candidate files
          (subset) and an optional status result.
          """
          def __init__(self, ctx, subset=None, status=None):
              self.ctx, self.subset, self._status = ctx, subset, status

          def status(self):
              """Return the status value given at construction (may be None)."""
              return self._status

          def matcher(self, patterns):
              """Build a matcher for patterns via ctx.match()."""
              return self.ctx.match(patterns)

          def filter(self, files):
              """Return the members of files that are in subset, in files order."""
              kept = []
              for name in files:
                  if name in self.subset:
                      kept.append(name)
              return kept

          def existing(self):
              """Return an iterator over the subset files contained in ctx."""
              return (name for name in self.subset if name in self.ctx)

          def narrow(self, files):
              """Return a new matchctx whose subset is filter(files)."""
              kept = self.filter(files)
              return matchctx(self.ctx, kept, self._status)

      def _intree(funcs, tree):
          """Tell whether tree calls any of the functions named in funcs.

          tree is a parse tree of nested tuples; anything that is not a tuple
          counts as a leaf and yields False.
          """
          if not isinstance(tree, tuple):
              return False
          # a call node looks like ('func', ('symbol', name), args)
          if (tree[0] == 'func' and tree[1][0] == 'symbol'
              and tree[1][1] in funcs):
              return True
          # otherwise search every child
          for child in tree[1:]:
              if _intree(funcs, child):
                  return True
          return False

      def getfileset(ctx, expr):
          """Evaluate the fileset expression expr against ctx.

          Returns whatever the evaluated tree yields (a list of file names for
          the handlers in this module). Raises error.ParseError when the
          parser stops before the end of expr.
          """
          tree, pos = parse(expr)
          if pos != len(expr):
              raise error.ParseError(_("invalid token"), pos)

          # do we need status info?
          statusfuncs = ['modified', 'added', 'removed', 'deleted',
                         'unknown', 'ignored', 'clean']
          if _intree(statusfuncs, tree):
              # unknown and ignored files are only requested when the
              # expression actually names those predicates
              wantunknown = _intree(['unknown'], tree)
              wantignored = _intree(['ignored'], tree)

              r = ctx._repo
              status = r.status(ctx.p1(), ctx,
                                unknown=wantunknown, ignored=wantignored,
                                clean=True)
              # the candidate files are the union of all status categories
              subset = []
              for c in status:
                  subset.extend(c)
          else:
              status = None
              # The subset is traversed more than once while evaluating (for
              # example by notset and matchctx.filter), so it must be a real
              # list; ctx.walk() may hand back a one-shot iterator (confirm
              # per context class).
              subset = list(ctx.walk(ctx.match([])))

          return getset(matchctx(ctx, subset, status), tree)

      # tell hggettext to extract docstrings from these functions:
      # (every predicate registered in symbols, so those docstrings are
      # translatable text and not only developer documentation)

      i18nfunctions = symbols.values()

	Site-wide shortcuts
/	Use quick search box
g h	Goto home page
g g	Goto my private gists page
g G	Goto my public gists page
g 0-9	Goto bookmarked items from 0-9
n r	New repository page
n g	New gist page

	Repositories
g s	Goto summary page
g c	Goto changelog page
g f	Goto files page
g F	Goto files page with file search activated
g p	Goto pull requests page
g o	Goto repository settings
g O	Goto repository access permissions settings
t s	Toggle sidebar on some pages

				# fileset.py - file set queries for mercurial
				#
				# Copyright 2010 Matt Mackall <mpm@selenic.com>
				#
				# This software may be used and distributed according to the terms of the
				# GNU General Public License version 2 or any later version.

				import parser, error, util, merge, re
				from i18n import _

				# Token table handed to parser.parser(). Keys are the token types
				# yielded by tokenize(). The "|" key had been turned into "\|" by a
				# markup escape, which no token produced by tokenize() matches.
				elements = {
				    "(": (20, ("group", 1, ")"), ("func", 1, ")")),
				    "-": (5, ("negate", 19), ("minus", 5)),
				    "not": (10, ("not", 10)),
				    "!": (10, ("not", 10)),
				    "and": (5, None, ("and", 5)),
				    "&": (5, None, ("and", 5)),
				    "or": (4, None, ("or", 4)),
				    "|": (4, None, ("or", 4)),
				    "+": (4, None, ("or", 4)),
				    ",": (2, None, ("list", 2)),
				    ")": (0, None, None),
				    "symbol": (0, ("symbol",), None),
				    "string": (0, ("string",), None),
				    "end": (0, None, None),
				}

				keywords = set(['and', 'or', 'not'])

				globchars = ".*{}[]?/\\"

				def tokenize(program):
				    """Yield ``(type, value, position)`` tokens for a fileset expression.

				    Operators and keywords carry ``None`` as value, quoted text is
				    yielded as ``'string'`` and any other word as ``'symbol'``. The
				    stream always ends with ``('end', None, pos)``. Raises
				    error.ParseError on an unterminated string or an unexpected
				    character.
				    """
				    pos, l = 0, len(program)
				    while pos < l:
				        c = program[pos]
				        if c.isspace(): # skip inter-token whitespace
				            pass
				        # the operator list had a stray backslash ("\|") from a markup
				        # escape, which made a lone backslash count as an operator
				        elif c in "(),-|&+!": # handle simple operators
				            yield (c, None, pos)
				        elif (c in '"\'' or c == 'r' and
				              program[pos:pos + 2] in ("r'", 'r"')): # handle quoted strings
				            if c == 'r':
				                # step over the r prefix; raw text is kept verbatim
				                pos += 1
				                c = program[pos]
				                decode = lambda x: x
				            else:
				                decode = lambda x: x.decode('string-escape')
				            pos += 1
				            s = pos
				            while pos < l: # find closing quote
				                d = program[pos]
				                if d == '\\': # skip over escaped characters
				                    pos += 2
				                    continue
				                if d == c:
				                    yield ('string', decode(program[s:pos]), s)
				                    break
				                pos += 1
				            else:
				                raise error.ParseError(_("unterminated string"), s)
				        elif c.isalnum() or c in globchars or ord(c) > 127:
				            # gather up a symbol/keyword
				            s = pos
				            pos += 1
				            while pos < l: # find end of symbol
				                d = program[pos]
				                if not (d.isalnum() or d in globchars or ord(d) > 127):
				                    break
				                pos += 1
				            sym = program[s:pos]
				            if sym in keywords: # operator keywords
				                yield (sym, None, s)
				            else:
				                yield ('symbol', sym, s)
				            # the shared increment below steps back onto the first
				            # character after the symbol
				            pos -= 1
				        else:
				            raise error.ParseError(_("syntax error"), pos)
				        pos += 1
				    yield ('end', None, pos)

				parse = parser.parser(tokenize, elements).parse

				def getstring(x, err):
				if x and (x[0] == 'string' or x[0] == 'symbol'):
				return x[1]
				raise error.ParseError(err)

				def getset(mctx, x):
				if not x:
				raise error.ParseError(_("missing argument"))
				return methods[x[0]](mctx, *x[1:])

				def stringset(mctx, x):
				m = mctx.matcher([x])
				return [f for f in mctx.subset if m(f)]

				def andset(mctx, x, y):
				return getset(mctx.narrow(getset(mctx, x)), y)

				def orset(mctx, x, y):
				# needs optimizing
				xl = getset(mctx, x)
				yl = getset(mctx, y)
				return xl + [f for f in yl if f not in xl]

				def notset(mctx, x):
				s = set(getset(mctx, x))
				return [r for r in mctx.subset if r not in s]

				def listset(mctx, a, b):
				raise error.ParseError(_("can't use a list in this context"))

				def modified(mctx, x):
				"""``modified()``
				File that is modified according to status.
				"""
				# i18n: "modified" is a keyword
				getargs(x, 0, 0, _("modified takes no arguments"))
				s = mctx.status()[0]
				return [f for f in mctx.subset if f in s]

				def added(mctx, x):
				"""``added()``
				File that is added according to status.
				"""
				# i18n: "added" is a keyword
				getargs(x, 0, 0, _("added takes no arguments"))
				s = mctx.status()[1]
				return [f for f in mctx.subset if f in s]

				def removed(mctx, x):
				"""``removed()``
				File that is removed according to status.
				"""
				# i18n: "removed" is a keyword
				getargs(x, 0, 0, _("removed takes no arguments"))
				s = mctx.status()[2]
				return [f for f in mctx.subset if f in s]

				def deleted(mctx, x):
				"""``deleted()``
				File that is deleted according to status.
				"""
				# i18n: "deleted" is a keyword
				getargs(x, 0, 0, _("deleted takes no arguments"))
				s = mctx.status()[3]
				return [f for f in mctx.subset if f in s]

				def unknown(mctx, x):
				"""``unknown()``
				File that is unknown according to status. These files will only be
				considered if this predicate is used.
				"""
				# i18n: "unknown" is a keyword
				getargs(x, 0, 0, _("unknown takes no arguments"))
				s = mctx.status()[4]
				return [f for f in mctx.subset if f in s]

				def ignored(mctx, x):
				"""``ignored()``
				File that is ignored according to status. These files will only be
				considered if this predicate is used.
				"""
				# i18n: "ignored" is a keyword
				getargs(x, 0, 0, _("ignored takes no arguments"))
				s = mctx.status()[5]
				return [f for f in mctx.subset if f in s]

				def clean(mctx, x):
				"""``clean()``
				File that is clean according to status.
				"""
				# i18n: "clean" is a keyword
				getargs(x, 0, 0, _("clean takes no arguments"))
				s = mctx.status()[6]
				return [f for f in mctx.subset if f in s]

				def func(mctx, a, b):
				if a[0] == 'symbol' and a[1] in symbols:
				return symbols[a[1]](mctx, b)
				raise error.ParseError(_("not a function: %s") % a[1])

				def getlist(x):
				if not x:
				return []
				if x[0] == 'list':
				return getlist(x[1]) + [x[2]]
				return [x]

				def getargs(x, min, max, err):
				l = getlist(x)
				if len(l) < min or len(l) > max:
				raise error.ParseError(err)
				return l

				def binary(mctx, x):
				"""``binary()``
				File that appears to be binary (contains NUL bytes).
				"""
				# i18n: "binary" is a keyword
				getargs(x, 0, 0, _("binary takes no arguments"))
				return [f for f in mctx.existing() if util.binary(mctx.ctx[f].data())]

				def exec_(mctx, x):
				"""``exec()``
				File that is marked as executable.
				"""
				# i18n: "exec" is a keyword
				getargs(x, 0, 0, _("exec takes no arguments"))
				return [f for f in mctx.existing() if mctx.ctx.flags(f) == 'x']

				def symlink(mctx, x):
				"""``symlink()``
				File that is marked as a symlink.
				"""
				# i18n: "symlink" is a keyword
				getargs(x, 0, 0, _("symlink takes no arguments"))
				return [f for f in mctx.existing() if mctx.ctx.flags(f) == 'l']

				def resolved(mctx, x):
				"""``resolved()``
				File that is marked resolved according to the resolve state.
				"""
				# i18n: "resolved" is a keyword
				getargs(x, 0, 0, _("resolved takes no arguments"))
				if mctx.ctx.rev() is not None:
				return []
				ms = merge.mergestate(mctx.ctx._repo)
				return [f for f in mctx.subset if f in ms and ms[f] == 'r']

				def unresolved(mctx, x):
				"""``unresolved()``
				File that is marked unresolved according to the resolve state.
				"""
				# i18n: "unresolved" is a keyword
				getargs(x, 0, 0, _("unresolved takes no arguments"))
				if mctx.ctx.rev() is not None:
				return []
				ms = merge.mergestate(mctx.ctx._repo)
				return [f for f in mctx.subset if f in ms and ms[f] == 'u']

				def hgignore(mctx, x):
				"""``hgignore()``
				File that matches the active .hgignore pattern.
				"""
				getargs(x, 0, 0, _("hgignore takes no arguments"))
				ignore = mctx.ctx._repo.dirstate._ignore
				return [f for f in mctx.subset if ignore(f)]

				def grep(mctx, x):
				"""``grep(regex)``
				File contains the given regular expression.
				"""
				pat = getstring(x, _("grep requires a pattern"))
				r = re.compile(pat)
				return [f for f in mctx.existing() if r.search(mctx.ctx[f].data())]

				# Size suffixes understood by _sizetoint() and _sizetomax(), each mapped
				# to its multiplier. The exponent operators had been lost in extraction
				# (2**10 had become 210); the values are powers of 1024.
				_units = dict(k=2**10, K=2**10, kB=2**10, KB=2**10,
				              M=2**20, MB=2**20, G=2**30, GB=2**30)

				def _sizetoint(s):
				try:
				s = s.strip()
				for k, v in _units.items():
				if s.endswith(k):
				return int(float(s[:-len(k)]) * v)
				return int(s)
				except ValueError:
				raise error.ParseError(_("couldn't parse size: %s") % s)

				def _sizetomax(s):
				try:
				s = s.strip()
				for k, v in _units.items():
				if s.endswith(k):
				# max(4k) = 5k - 1, max(4.5k) = 4.6k - 1
				n = s[:-len(k)]
				inc = 1.0
				if "." in n:
				inc /= 10 ** len(n.split(".")[1])
				return int((float(n) + inc) * v) - 1
				# no extension, this is a precise value
				return int(s)
				except ValueError:
				raise error.ParseError(_("couldn't parse size: %s") % s)

				def size(mctx, x):
				    """``size(expression)``
				    File size matches the given expression. Examples:

				    - 1k (files from 1024 to 2047 bytes)
				    - < 20k (files less than 20480 bytes)
				    - >= .5MB (files at least 524288 bytes)
				    - 4k - 1MB (files from 4096 bytes to 1048576 bytes)
				    """

				    # i18n: "size" is a keyword
				    expr = getstring(x, _("size requires an expression")).strip()
				    if '-' in expr: # do we have a range?
				        a, b = expr.split('-', 1)
				        a = _sizetoint(a)
				        b = _sizetoint(b)
				        m = lambda x: x >= a and x <= b
				    elif expr.startswith("<="):
				        a = _sizetoint(expr[2:])
				        m = lambda x: x <= a
				    elif expr.startswith("<"):
				        a = _sizetoint(expr[1:])
				        m = lambda x: x < a
				    elif expr.startswith(">="):
				        a = _sizetoint(expr[2:])
				        m = lambda x: x >= a
				    elif expr.startswith(">"):
				        a = _sizetoint(expr[1:])
				        m = lambda x: x > a
				    # isdigit must be *called* (the bare method is always true), and
				    # slicing keeps an empty expression from raising IndexError
				    elif expr[:1].isdigit() or expr.startswith('.'):
				        # bare value: match every size that reads as what was written
				        a = _sizetoint(expr)
				        b = _sizetomax(expr)
				        m = lambda x: x >= a and x <= b
				    else:
				        raise error.ParseError(_("couldn't parse size: %s") % expr)

				    # only files present in the context have a size
				    return [f for f in mctx.existing() if m(mctx.ctx[f].size())]

				def encoding(mctx, x):
				"""``encoding(name)``
				File can be successfully decoded with the given character
				encoding. May not be useful for encodings other than ASCII and
				UTF-8.
				"""

				# i18n: "encoding" is a keyword
				enc = getstring(x, _("encoding requires an encoding name"))

				s = []
				for f in mctx.existing():
				d = mctx.ctx[f].data()
				try:
				d.decode(enc)
				except LookupError:
				raise util.Abort(_("unknown encoding '%s'") % enc)
				except UnicodeDecodeError:
				continue
				s.append(f)

				return s

				def copied(mctx, x):
				"""``copied()``
				File that is recorded as being copied.
				"""
				# i18n: "copied" is a keyword
				getargs(x, 0, 0, _("copied takes no arguments"))
				s = []
				for f in mctx.subset:
				p = mctx.ctx[f].parents()
				if p and p[0].path() != f:
				s.append(f)
				return s

				def subrepo(mctx, x):
				"""``subrepo([pattern])``
				Subrepositories whose paths match the given pattern.
				"""
				# i18n: "subrepo" is a keyword
				getargs(x, 0, 1, _("subrepo takes at most one argument"))
				ctx = mctx.ctx
				sstate = ctx.substate
				if x:
				pat = getstring(x, _("subrepo requires a pattern or no arguments"))

				import match as matchmod # avoid circular import issues
				fast = not matchmod.patkind(pat)
				if fast:
				def m(s):
				return (s == pat)
				else:
				m = matchmod.match(ctx._repo.root, '', [pat], ctx=ctx)
				return [sub for sub in sstate if m(sub)]
				else:
				return [sub for sub in sstate]

				symbols = {
				'added': added,
				'binary': binary,
				'clean': clean,
				'copied': copied,
				'deleted': deleted,
				'encoding': encoding,
				'exec': exec_,
				'grep': grep,
				'ignored': ignored,
				'hgignore': hgignore,
				'modified': modified,
				'removed': removed,
				'resolved': resolved,
				'size': size,
				'symlink': symlink,
				'unknown': unknown,
				'unresolved': unresolved,
				'subrepo': subrepo,
				}

				methods = {
				'string': stringset,
				'symbol': stringset,
				'and': andset,
				'or': orset,
				'list': listset,
				'group': getset,
				'not': notset,
				'func': func,
				}

				class matchctx(object):
				def __init__(self, ctx, subset=None, status=None):
				self.ctx = ctx
				self.subset = subset
				self._status = status
				def status(self):
				return self._status
				def matcher(self, patterns):
				return self.ctx.match(patterns)
				def filter(self, files):
				return [f for f in files if f in self.subset]
				def existing(self):
				return (f for f in self.subset if f in self.ctx)
				def narrow(self, files):
				return matchctx(self.ctx, self.filter(files), self._status)

				def _intree(funcs, tree):
				if isinstance(tree, tuple):
				if tree[0] == 'func' and tree[1][0] == 'symbol':
				if tree[1][1] in funcs:
				return True
				for s in tree[1:]:
				if _intree(funcs, s):
				return True
				return False

				def getfileset(ctx, expr):
				tree, pos = parse(expr)
				if (pos != len(expr)):
				raise error.ParseError(_("invalid token"), pos)

				# do we need status info?
				if _intree(['modified', 'added', 'removed', 'deleted',
				'unknown', 'ignored', 'clean'], tree):
				unknown = _intree(['unknown'], tree)
				ignored = _intree(['ignored'], tree)

				r = ctx._repo
				status = r.status(ctx.p1(), ctx,
				unknown=unknown, ignored=ignored, clean=True)
				subset = []
				for c in status:
				subset.extend(c)
				else:
				status = None
				subset = ctx.walk(ctx.match([]))

				return getset(matchctx(ctx, subset, status), tree)

				# tell hggettext to extract docstrings from these functions:
				i18nfunctions = symbols.values()