##// END OF EJS Templates
fileset: copied takes no arguments
Mads Kiilerich -
r14718:0c819486 stable
parent child Browse files
Show More
@@ -1,424 +1,425 b''
1 1 # fileset.py - file set queries for mercurial
2 2 #
3 3 # Copyright 2010 Matt Mackall <mpm@selenic.com>
4 4 #
5 5 # This software may be used and distributed according to the terms of the
6 6 # GNU General Public License version 2 or any later version.
7 7
8 8 import parser, error, util, merge, re
9 9 from i18n import _
10 10
11 11 elements = {
12 12 "(": (20, ("group", 1, ")"), ("func", 1, ")")),
13 13 "-": (5, ("negate", 19), ("minus", 5)),
14 14 "not": (10, ("not", 10)),
15 15 "!": (10, ("not", 10)),
16 16 "and": (5, None, ("and", 5)),
17 17 "&": (5, None, ("and", 5)),
18 18 "or": (4, None, ("or", 4)),
19 19 "|": (4, None, ("or", 4)),
20 20 "+": (4, None, ("or", 4)),
21 21 ",": (2, None, ("list", 2)),
22 22 ")": (0, None, None),
23 23 "symbol": (0, ("symbol",), None),
24 24 "string": (0, ("string",), None),
25 25 "end": (0, None, None),
26 26 }
27 27
28 28 keywords = set(['and', 'or', 'not'])
29 29
30 30 globchars = ".*{}[]?/\\"
31 31
32 32 def tokenize(program):
33 33 pos, l = 0, len(program)
34 34 while pos < l:
35 35 c = program[pos]
36 36 if c.isspace(): # skip inter-token whitespace
37 37 pass
38 38 elif c in "(),-|&+!": # handle simple operators
39 39 yield (c, None, pos)
40 40 elif (c in '"\'' or c == 'r' and
41 41 program[pos:pos + 2] in ("r'", 'r"')): # handle quoted strings
42 42 if c == 'r':
43 43 pos += 1
44 44 c = program[pos]
45 45 decode = lambda x: x
46 46 else:
47 47 decode = lambda x: x.decode('string-escape')
48 48 pos += 1
49 49 s = pos
50 50 while pos < l: # find closing quote
51 51 d = program[pos]
52 52 if d == '\\': # skip over escaped characters
53 53 pos += 2
54 54 continue
55 55 if d == c:
56 56 yield ('string', decode(program[s:pos]), s)
57 57 break
58 58 pos += 1
59 59 else:
60 60 raise error.ParseError(_("unterminated string"), s)
61 61 elif c.isalnum() or c in globchars or ord(c) > 127:
62 62 # gather up a symbol/keyword
63 63 s = pos
64 64 pos += 1
65 65 while pos < l: # find end of symbol
66 66 d = program[pos]
67 67 if not (d.isalnum() or d in globchars or ord(d) > 127):
68 68 break
69 69 pos += 1
70 70 sym = program[s:pos]
71 71 if sym in keywords: # operator keywords
72 72 yield (sym, None, s)
73 73 else:
74 74 yield ('symbol', sym, s)
75 75 pos -= 1
76 76 else:
77 77 raise error.ParseError(_("syntax error"), pos)
78 78 pos += 1
79 79 yield ('end', None, pos)
80 80
81 81 parse = parser.parser(tokenize, elements).parse
82 82
83 83 def getstring(x, err):
84 84 if x and (x[0] == 'string' or x[0] == 'symbol'):
85 85 return x[1]
86 86 raise error.ParseError(err)
87 87
88 88 def getset(mctx, x):
89 89 if not x:
90 90 raise error.ParseError(_("missing argument"))
91 91 return methods[x[0]](mctx, *x[1:])
92 92
93 93 def stringset(mctx, x):
94 94 m = mctx.matcher([x])
95 95 return [f for f in mctx.subset if m(f)]
96 96
97 97 def andset(mctx, x, y):
98 98 return getset(mctx.narrow(getset(mctx, x)), y)
99 99
100 100 def orset(mctx, x, y):
101 101 # needs optimizing
102 102 xl = getset(mctx, x)
103 103 yl = getset(mctx, y)
104 104 return xl + [f for f in yl if f not in xl]
105 105
106 106 def notset(mctx, x):
107 107 s = set(getset(mctx, x))
108 108 return [r for r in mctx.subset if r not in s]
109 109
110 110 def listset(mctx, a, b):
111 111 raise error.ParseError(_("can't use a list in this context"))
112 112
113 113 def modified(mctx, x):
114 114 """``modified()``
115 115 File that is modified according to status.
116 116 """
117 117 getargs(x, 0, 0, _("modified takes no arguments"))
118 118 s = mctx.status()[0]
119 119 return [f for f in mctx.subset if f in s]
120 120
121 121 def added(mctx, x):
122 122 """``added()``
123 123 File that is added according to status.
124 124 """
125 125 getargs(x, 0, 0, _("added takes no arguments"))
126 126 s = mctx.status()[1]
127 127 return [f for f in mctx.subset if f in s]
128 128
129 129 def removed(mctx, x):
130 130 """``removed()``
131 131 File that is removed according to status.
132 132 """
133 133 getargs(x, 0, 0, _("removed takes no arguments"))
134 134 s = mctx.status()[2]
135 135 return [f for f in mctx.subset if f in s]
136 136
137 137 def deleted(mctx, x):
138 138 """``deleted()``
139 139 File that is deleted according to status.
140 140 """
141 141 getargs(x, 0, 0, _("deleted takes no arguments"))
142 142 s = mctx.status()[3]
143 143 return [f for f in mctx.subset if f in s]
144 144
145 145 def unknown(mctx, x):
146 146 """``unknown()``
147 147 File that is unknown according to status. These files will only be
148 148 considered if this predicate is used.
149 149 """
150 150 getargs(x, 0, 0, _("unknown takes no arguments"))
151 151 s = mctx.status()[4]
152 152 return [f for f in mctx.subset if f in s]
153 153
154 154 def ignored(mctx, x):
155 155 """``ignored()``
156 156 File that is ignored according to status. These files will only be
157 157 considered if this predicate is used.
158 158 """
159 159 getargs(x, 0, 0, _("ignored takes no arguments"))
160 160 s = mctx.status()[5]
161 161 return [f for f in mctx.subset if f in s]
162 162
163 163 def clean(mctx, x):
164 164 """``clean()``
165 165 File that is clean according to status.
166 166 """
167 167 getargs(x, 0, 0, _("clean takes no arguments"))
168 168 s = mctx.status()[6]
169 169 return [f for f in mctx.subset if f in s]
170 170
171 171 def func(mctx, a, b):
172 172 if a[0] == 'symbol' and a[1] in symbols:
173 173 return symbols[a[1]](mctx, b)
174 174 raise error.ParseError(_("not a function: %s") % a[1])
175 175
176 176 def getlist(x):
177 177 if not x:
178 178 return []
179 179 if x[0] == 'list':
180 180 return getlist(x[1]) + [x[2]]
181 181 return [x]
182 182
183 183 def getargs(x, min, max, err):
184 184 l = getlist(x)
185 185 if len(l) < min or len(l) > max:
186 186 raise error.ParseError(err)
187 187 return l
188 188
189 189 def binary(mctx, x):
190 190 """``binary()``
191 191 File that appears to be binary (contails NUL bytes).
192 192 """
193 193 getargs(x, 0, 0, _("binary takes no arguments"))
194 194 return [f for f in mctx.subset if util.binary(mctx.ctx[f].data())]
195 195
196 196 def exec_(mctx, x):
197 197 """``exec()``
198 198 File that is marked as executable.
199 199 """
200 200 getargs(x, 0, 0, _("exec takes no arguments"))
201 201 return [f for f in mctx.subset if mctx.ctx.flags(f) == 'x']
202 202
203 203 def symlink(mctx, x):
204 204 """``symlink()``
205 205 File that is marked as a symlink.
206 206 """
207 207 getargs(x, 0, 0, _("symlink takes no arguments"))
208 208 return [f for f in mctx.subset if mctx.ctx.flags(f) == 'l']
209 209
210 210 def resolved(mctx, x):
211 211 """``resolved()``
212 212 File that is marked resolved according to the resolve state.
213 213 """
214 214 getargs(x, 0, 0, _("resolved takes no arguments"))
215 215 if mctx.ctx.rev() is not None:
216 216 return []
217 217 ms = merge.mergestate(mctx.ctx._repo)
218 218 return [f for f in mctx.subset if f in ms and ms[f] == 'r']
219 219
220 220 def unresolved(mctx, x):
221 221 """``unresolved()``
222 222 File that is marked unresolved according to the resolve state.
223 223 """
224 224 getargs(x, 0, 0, _("unresolved takes no arguments"))
225 225 if mctx.ctx.rev() is not None:
226 226 return []
227 227 ms = merge.mergestate(mctx.ctx._repo)
228 228 return [f for f in mctx.subset if f in ms and ms[f] == 'u']
229 229
230 230 def hgignore(mctx, x):
231 231 """``hgignore()``
232 232 File that matches the active .hgignore pattern.
233 233 """
234 234 getargs(x, 0, 0, _("hgignore takes no arguments"))
235 235 ignore = mctx.ctx._repo.dirstate._ignore
236 236 return [f for f in mctx.subset if ignore(f)]
237 237
238 238 def grep(mctx, x):
239 239 """``grep(regex)``
240 240 File contains the given regular expression.
241 241 """
242 242 pat = getstring(x, _("grep requires a pattern"))
243 243 r = re.compile(pat)
244 244 return [f for f in mctx.subset if r.search(mctx.ctx[f].data())]
245 245
246 246 _units = dict(k=2**10, K=2**10, kB=2**10, KB=2**10,
247 247 M=2**20, MB=2**20, G=2**30, GB=2**30)
248 248
249 249 def _sizetoint(s):
250 250 try:
251 251 s = s.strip()
252 252 for k, v in _units.items():
253 253 if s.endswith(k):
254 254 return int(float(s[:-len(k)]) * v)
255 255 return int(s)
256 256 except ValueError:
257 257 raise error.ParseError(_("couldn't parse size: %s") % s)
258 258
259 259 def _sizetomax(s):
260 260 try:
261 261 s = s.strip()
262 262 for k, v in _units.items():
263 263 if s.endswith(k):
264 264 # max(4k) = 5k - 1, max(4.5k) = 4.6k - 1
265 265 n = s[:-len(k)]
266 266 inc = 1.0
267 267 if "." in n:
268 268 inc /= 10 ** len(n.split(".")[1])
269 269 return int((float(n) + inc) * v) - 1
270 270 # no extension, this is a precise value
271 271 return int(s)
272 272 except ValueError:
273 273 raise error.ParseError(_("couldn't parse size: %s") % s)
274 274
275 275 def size(mctx, x):
276 276 """``size(expression)``
277 277 File size matches the given expression. Examples:
278 278
279 279 - 1k (files from 1024 to 2047 bytes)
280 280 - < 20k (files less than 20480 bytes)
281 281 - >= .5MB (files at least 524288 bytes)
282 282 - 4k - 1MB (files from 4096 bytes to 1048576 bytes)
283 283 """
284 284
285 285 expr = getstring(x, _("size requires an expression")).strip()
286 286 if '-' in expr: # do we have a range?
287 287 a, b = expr.split('-', 1)
288 288 a = _sizetoint(a)
289 289 b = _sizetoint(b)
290 290 m = lambda x: x >= a and x <= b
291 291 elif expr.startswith("<="):
292 292 a = _sizetoint(expr[2:])
293 293 m = lambda x: x <= a
294 294 elif expr.startswith("<"):
295 295 a = _sizetoint(expr[1:])
296 296 m = lambda x: x < a
297 297 elif expr.startswith(">="):
298 298 a = _sizetoint(expr[2:])
299 299 m = lambda x: x >= a
300 300 elif expr.startswith(">"):
301 301 a = _sizetoint(expr[1:])
302 302 m = lambda x: x > a
303 303 elif expr[0].isdigit or expr[0] == '.':
304 304 a = _sizetoint(expr)
305 305 b = _sizetomax(expr)
306 306 m = lambda x: x >= a and x <= b
307 307 else:
308 308 raise error.ParseError(_("couldn't parse size: %s") % expr)
309 309
310 310 return [f for f in mctx.subset if m(mctx.ctx[f].size())]
311 311
312 312 def encoding(mctx, x):
313 313 """``encoding(name)``
314 314 File can be successfully decoded with the given character
315 315 encoding. May not be useful for encodings other than ASCII and
316 316 UTF-8.
317 317 """
318 318
319 319 enc = getstring(x, _("encoding requires an encoding name"))
320 320
321 321 s = []
322 322 for f in mctx.subset:
323 323 d = mctx.ctx[f].data()
324 324 try:
325 325 d.decode(enc)
326 326 except LookupError:
327 327 raise util.Abort(_("unknown encoding '%s'") % enc)
328 328 except UnicodeDecodeError:
329 329 continue
330 330 s.append(f)
331 331
332 332 return s
333 333
334 334 def copied(mctx, x):
335 335 """``copied()``
336 336 File that is recorded as being copied.
337 337 """
338 getargs(x, 0, 0, _("copied takes no arguments"))
338 339 s = []
339 340 for f in mctx.subset:
340 341 p = mctx.ctx[f].parents()
341 342 if p and p[0].path() != f:
342 343 s.append(f)
343 344 return s
344 345
345 346 symbols = {
346 347 'added': added,
347 348 'binary': binary,
348 349 'clean': clean,
349 350 'copied': copied,
350 351 'deleted': deleted,
351 352 'encoding': encoding,
352 353 'exec': exec_,
353 354 'grep': grep,
354 355 'ignored': ignored,
355 356 'hgignore': hgignore,
356 357 'modified': modified,
357 358 'removed': removed,
358 359 'resolved': resolved,
359 360 'size': size,
360 361 'symlink': symlink,
361 362 'unknown': unknown,
362 363 'unresolved': unresolved,
363 364 }
364 365
365 366 methods = {
366 367 'string': stringset,
367 368 'symbol': stringset,
368 369 'and': andset,
369 370 'or': orset,
370 371 'list': listset,
371 372 'group': getset,
372 373 'not': notset,
373 374 'func': func,
374 375 }
375 376
376 377 class matchctx(object):
377 378 def __init__(self, ctx, subset=None, status=None):
378 379 self.ctx = ctx
379 380 self.subset = subset
380 381 self._status = status
381 382 def status(self):
382 383 return self._status
383 384 def matcher(self, patterns):
384 385 return self.ctx.match(patterns)
385 386 def filter(self, files):
386 387 return [f for f in files if f in self.subset]
387 388 def narrow(self, files):
388 389 return matchctx(self.ctx, self.filter(files), self._status)
389 390
390 391 def _intree(funcs, tree):
391 392 if isinstance(tree, tuple):
392 393 if tree[0] == 'func' and tree[1][0] == 'symbol':
393 394 if tree[1][1] in funcs:
394 395 return True
395 396 for s in tree[1:]:
396 397 if _intree(funcs, s):
397 398 return True
398 399 return False
399 400
400 401 def getfileset(ctx, expr):
401 402 tree, pos = parse(expr)
402 403 if (pos != len(expr)):
403 404 raise error.ParseError(_("invalid token"), pos)
404 405
405 406 # do we need status info?
406 407 if _intree(['modified', 'added', 'removed', 'deleted',
407 408 'unknown', 'ignored', 'clean'], tree):
408 409 unknown = _intree(['unknown'], tree)
409 410 ignored = _intree(['ignored'], tree)
410 411
411 412 r = ctx._repo
412 413 status = r.status(ctx.p1(), ctx,
413 414 unknown=unknown, ignored=ignored, clean=True)
414 415 subset = []
415 416 for c in status:
416 417 subset.extend(c)
417 418 else:
418 419 status = None
419 420 subset = ctx.walk(ctx.match([]))
420 421
421 422 return getset(matchctx(ctx, subset, status), tree)
422 423
423 424 # tell hggettext to extract docstrings from these functions:
424 425 i18nfunctions = symbols.values()
General Comments 0
You need to be logged in to leave comments. Login now