##// END OF EJS Templates
dirstate: use self._filename instead of immediate string `dirstate`...
FUJIWARA Katsunori -
r25226:00d426a3 default
parent child Browse files
Show More
@@ -1,987 +1,988
1 1 # dirstate.py - working directory tracking for mercurial
2 2 #
3 3 # Copyright 2005-2007 Matt Mackall <mpm@selenic.com>
4 4 #
5 5 # This software may be used and distributed according to the terms of the
6 6 # GNU General Public License version 2 or any later version.
7 7
8 8 from node import nullid
9 9 from i18n import _
10 10 import scmutil, util, osutil, parsers, encoding, pathutil
11 11 import os, stat, errno
12 12 import match as matchmod
13 13
14 14 propertycache = util.propertycache
15 15 filecache = scmutil.filecache
16 16 _rangemask = 0x7fffffff
17 17
18 18 dirstatetuple = parsers.dirstatetuple
19 19
20 20 class repocache(filecache):
21 21 """filecache for files in .hg/"""
22 22 def join(self, obj, fname):
23 23 return obj._opener.join(fname)
24 24
25 25 class rootcache(filecache):
26 26 """filecache for files in the repository root"""
27 27 def join(self, obj, fname):
28 28 return obj._join(fname)
29 29
30 30 class dirstate(object):
31 31
32 32 def __init__(self, opener, ui, root, validate):
33 33 '''Create a new dirstate object.
34 34
35 35 opener is an open()-like callable that can be used to open the
36 36 dirstate file; root is the root of the directory tracked by
37 37 the dirstate.
38 38 '''
39 39 self._opener = opener
40 40 self._validate = validate
41 41 self._root = root
42 42 # ntpath.join(root, '') of Python 2.7.9 does not add sep if root is
43 43 # UNC path pointing to root share (issue4557)
44 44 self._rootdir = pathutil.normasprefix(root)
45 45 self._dirty = False
46 46 self._dirtypl = False
47 47 self._lastnormaltime = 0
48 48 self._ui = ui
49 49 self._filecache = {}
50 50 self._parentwriters = 0
51 self._filename = 'dirstate'
51 52
52 53 def beginparentchange(self):
53 54 '''Marks the beginning of a set of changes that involve changing
54 55 the dirstate parents. If there is an exception during this time,
55 56 the dirstate will not be written when the wlock is released. This
56 57 prevents writing an incoherent dirstate where the parent doesn't
57 58 match the contents.
58 59 '''
59 60 self._parentwriters += 1
60 61
61 62 def endparentchange(self):
62 63 '''Marks the end of a set of changes that involve changing the
63 64 dirstate parents. Once all parent changes have been marked done,
64 65 the wlock will be free to write the dirstate on release.
65 66 '''
66 67 if self._parentwriters > 0:
67 68 self._parentwriters -= 1
68 69
69 70 def pendingparentchange(self):
70 71 '''Returns true if the dirstate is in the middle of a set of changes
71 72 that modify the dirstate parent.
72 73 '''
73 74 return self._parentwriters > 0
74 75
75 76 @propertycache
76 77 def _map(self):
77 78 '''Return the dirstate contents as a map from filename to
78 79 (state, mode, size, time).'''
79 80 self._read()
80 81 return self._map
81 82
82 83 @propertycache
83 84 def _copymap(self):
84 85 self._read()
85 86 return self._copymap
86 87
87 88 @propertycache
88 89 def _filefoldmap(self):
89 90 try:
90 91 makefilefoldmap = parsers.make_file_foldmap
91 92 except AttributeError:
92 93 pass
93 94 else:
94 95 return makefilefoldmap(self._map, util.normcasespec,
95 96 util.normcasefallback)
96 97
97 98 f = {}
98 99 normcase = util.normcase
99 100 for name, s in self._map.iteritems():
100 101 if s[0] != 'r':
101 102 f[normcase(name)] = name
102 103 f['.'] = '.' # prevents useless util.fspath() invocation
103 104 return f
104 105
105 106 @propertycache
106 107 def _dirfoldmap(self):
107 108 f = {}
108 109 normcase = util.normcase
109 110 for name in self._dirs:
110 111 f[normcase(name)] = name
111 112 return f
112 113
113 114 @repocache('branch')
114 115 def _branch(self):
115 116 try:
116 117 return self._opener.read("branch").strip() or "default"
117 118 except IOError, inst:
118 119 if inst.errno != errno.ENOENT:
119 120 raise
120 121 return "default"
121 122
122 123 @propertycache
123 124 def _pl(self):
124 125 try:
125 fp = self._opener("dirstate")
126 fp = self._opener(self._filename)
126 127 st = fp.read(40)
127 128 fp.close()
128 129 l = len(st)
129 130 if l == 40:
130 131 return st[:20], st[20:40]
131 132 elif l > 0 and l < 40:
132 133 raise util.Abort(_('working directory state appears damaged!'))
133 134 except IOError, err:
134 135 if err.errno != errno.ENOENT:
135 136 raise
136 137 return [nullid, nullid]
137 138
138 139 @propertycache
139 140 def _dirs(self):
140 141 return util.dirs(self._map, 'r')
141 142
142 143 def dirs(self):
143 144 return self._dirs
144 145
145 146 @rootcache('.hgignore')
146 147 def _ignore(self):
147 148 files = []
148 149 if os.path.exists(self._join('.hgignore')):
149 150 files.append(self._join('.hgignore'))
150 151 for name, path in self._ui.configitems("ui"):
151 152 if name == 'ignore' or name.startswith('ignore.'):
152 153 # we need to use os.path.join here rather than self._join
153 154 # because path is arbitrary and user-specified
154 155 files.append(os.path.join(self._rootdir, util.expandpath(path)))
155 156
156 157 if not files:
157 158 return util.never
158 159
159 160 pats = ['include:%s' % f for f in files]
160 161 return matchmod.match(self._root, '', [], pats, warn=self._ui.warn)
161 162
162 163 @propertycache
163 164 def _slash(self):
164 165 return self._ui.configbool('ui', 'slash') and os.sep != '/'
165 166
166 167 @propertycache
167 168 def _checklink(self):
168 169 return util.checklink(self._root)
169 170
170 171 @propertycache
171 172 def _checkexec(self):
172 173 return util.checkexec(self._root)
173 174
174 175 @propertycache
175 176 def _checkcase(self):
176 177 return not util.checkcase(self._join('.hg'))
177 178
178 179 def _join(self, f):
179 180 # much faster than os.path.join()
180 181 # it's safe because f is always a relative path
181 182 return self._rootdir + f
182 183
183 184 def flagfunc(self, buildfallback):
184 185 if self._checklink and self._checkexec:
185 186 def f(x):
186 187 try:
187 188 st = os.lstat(self._join(x))
188 189 if util.statislink(st):
189 190 return 'l'
190 191 if util.statisexec(st):
191 192 return 'x'
192 193 except OSError:
193 194 pass
194 195 return ''
195 196 return f
196 197
197 198 fallback = buildfallback()
198 199 if self._checklink:
199 200 def f(x):
200 201 if os.path.islink(self._join(x)):
201 202 return 'l'
202 203 if 'x' in fallback(x):
203 204 return 'x'
204 205 return ''
205 206 return f
206 207 if self._checkexec:
207 208 def f(x):
208 209 if 'l' in fallback(x):
209 210 return 'l'
210 211 if util.isexec(self._join(x)):
211 212 return 'x'
212 213 return ''
213 214 return f
214 215 else:
215 216 return fallback
216 217
217 218 @propertycache
218 219 def _cwd(self):
219 220 return os.getcwd()
220 221
221 222 def getcwd(self):
222 223 cwd = self._cwd
223 224 if cwd == self._root:
224 225 return ''
225 226 # self._root ends with a path separator if self._root is '/' or 'C:\'
226 227 rootsep = self._root
227 228 if not util.endswithsep(rootsep):
228 229 rootsep += os.sep
229 230 if cwd.startswith(rootsep):
230 231 return cwd[len(rootsep):]
231 232 else:
232 233 # we're outside the repo. return an absolute path.
233 234 return cwd
234 235
235 236 def pathto(self, f, cwd=None):
236 237 if cwd is None:
237 238 cwd = self.getcwd()
238 239 path = util.pathto(self._root, cwd, f)
239 240 if self._slash:
240 241 return util.pconvert(path)
241 242 return path
242 243
243 244 def __getitem__(self, key):
244 245 '''Return the current state of key (a filename) in the dirstate.
245 246
246 247 States are:
247 248 n normal
248 249 m needs merging
249 250 r marked for removal
250 251 a marked for addition
251 252 ? not tracked
252 253 '''
253 254 return self._map.get(key, ("?",))[0]
254 255
255 256 def __contains__(self, key):
256 257 return key in self._map
257 258
258 259 def __iter__(self):
259 260 for x in sorted(self._map):
260 261 yield x
261 262
262 263 def iteritems(self):
263 264 return self._map.iteritems()
264 265
265 266 def parents(self):
266 267 return [self._validate(p) for p in self._pl]
267 268
268 269 def p1(self):
269 270 return self._validate(self._pl[0])
270 271
271 272 def p2(self):
272 273 return self._validate(self._pl[1])
273 274
274 275 def branch(self):
275 276 return encoding.tolocal(self._branch)
276 277
277 278 def setparents(self, p1, p2=nullid):
278 279 """Set dirstate parents to p1 and p2.
279 280
280 281 When moving from two parents to one, 'm' merged entries a
281 282 adjusted to normal and previous copy records discarded and
282 283 returned by the call.
283 284
284 285 See localrepo.setparents()
285 286 """
286 287 if self._parentwriters == 0:
287 288 raise ValueError("cannot set dirstate parent without "
288 289 "calling dirstate.beginparentchange")
289 290
290 291 self._dirty = self._dirtypl = True
291 292 oldp2 = self._pl[1]
292 293 self._pl = p1, p2
293 294 copies = {}
294 295 if oldp2 != nullid and p2 == nullid:
295 296 for f, s in self._map.iteritems():
296 297 # Discard 'm' markers when moving away from a merge state
297 298 if s[0] == 'm':
298 299 if f in self._copymap:
299 300 copies[f] = self._copymap[f]
300 301 self.normallookup(f)
301 302 # Also fix up otherparent markers
302 303 elif s[0] == 'n' and s[2] == -2:
303 304 if f in self._copymap:
304 305 copies[f] = self._copymap[f]
305 306 self.add(f)
306 307 return copies
307 308
308 309 def setbranch(self, branch):
309 310 self._branch = encoding.fromlocal(branch)
310 311 f = self._opener('branch', 'w', atomictemp=True)
311 312 try:
312 313 f.write(self._branch + '\n')
313 314 f.close()
314 315
315 316 # make sure filecache has the correct stat info for _branch after
316 317 # replacing the underlying file
317 318 ce = self._filecache['_branch']
318 319 if ce:
319 320 ce.refresh()
320 321 except: # re-raises
321 322 f.discard()
322 323 raise
323 324
324 325 def _read(self):
325 326 self._map = {}
326 327 self._copymap = {}
327 328 try:
328 st = self._opener.read("dirstate")
329 st = self._opener.read(self._filename)
329 330 except IOError, err:
330 331 if err.errno != errno.ENOENT:
331 332 raise
332 333 return
333 334 if not st:
334 335 return
335 336
336 337 # Python's garbage collector triggers a GC each time a certain number
337 338 # of container objects (the number being defined by
338 339 # gc.get_threshold()) are allocated. parse_dirstate creates a tuple
339 340 # for each file in the dirstate. The C version then immediately marks
340 341 # them as not to be tracked by the collector. However, this has no
341 342 # effect on when GCs are triggered, only on what objects the GC looks
342 343 # into. This means that O(number of files) GCs are unavoidable.
343 344 # Depending on when in the process's lifetime the dirstate is parsed,
344 345 # this can get very expensive. As a workaround, disable GC while
345 346 # parsing the dirstate.
346 347 #
347 348 # (we cannot decorate the function directly since it is in a C module)
348 349 parse_dirstate = util.nogc(parsers.parse_dirstate)
349 350 p = parse_dirstate(self._map, self._copymap, st)
350 351 if not self._dirtypl:
351 352 self._pl = p
352 353
353 354 def invalidate(self):
354 355 for a in ("_map", "_copymap", "_filefoldmap", "_dirfoldmap", "_branch",
355 356 "_pl", "_dirs", "_ignore"):
356 357 if a in self.__dict__:
357 358 delattr(self, a)
358 359 self._lastnormaltime = 0
359 360 self._dirty = False
360 361 self._parentwriters = 0
361 362
362 363 def copy(self, source, dest):
363 364 """Mark dest as a copy of source. Unmark dest if source is None."""
364 365 if source == dest:
365 366 return
366 367 self._dirty = True
367 368 if source is not None:
368 369 self._copymap[dest] = source
369 370 elif dest in self._copymap:
370 371 del self._copymap[dest]
371 372
372 373 def copied(self, file):
373 374 return self._copymap.get(file, None)
374 375
375 376 def copies(self):
376 377 return self._copymap
377 378
378 379 def _droppath(self, f):
379 380 if self[f] not in "?r" and "_dirs" in self.__dict__:
380 381 self._dirs.delpath(f)
381 382
382 383 def _addpath(self, f, state, mode, size, mtime):
383 384 oldstate = self[f]
384 385 if state == 'a' or oldstate == 'r':
385 386 scmutil.checkfilename(f)
386 387 if f in self._dirs:
387 388 raise util.Abort(_('directory %r already in dirstate') % f)
388 389 # shadows
389 390 for d in util.finddirs(f):
390 391 if d in self._dirs:
391 392 break
392 393 if d in self._map and self[d] != 'r':
393 394 raise util.Abort(
394 395 _('file %r in dirstate clashes with %r') % (d, f))
395 396 if oldstate in "?r" and "_dirs" in self.__dict__:
396 397 self._dirs.addpath(f)
397 398 self._dirty = True
398 399 self._map[f] = dirstatetuple(state, mode, size, mtime)
399 400
400 401 def normal(self, f):
401 402 '''Mark a file normal and clean.'''
402 403 s = os.lstat(self._join(f))
403 404 mtime = int(s.st_mtime)
404 405 self._addpath(f, 'n', s.st_mode,
405 406 s.st_size & _rangemask, mtime & _rangemask)
406 407 if f in self._copymap:
407 408 del self._copymap[f]
408 409 if mtime > self._lastnormaltime:
409 410 # Remember the most recent modification timeslot for status(),
410 411 # to make sure we won't miss future size-preserving file content
411 412 # modifications that happen within the same timeslot.
412 413 self._lastnormaltime = mtime
413 414
414 415 def normallookup(self, f):
415 416 '''Mark a file normal, but possibly dirty.'''
416 417 if self._pl[1] != nullid and f in self._map:
417 418 # if there is a merge going on and the file was either
418 419 # in state 'm' (-1) or coming from other parent (-2) before
419 420 # being removed, restore that state.
420 421 entry = self._map[f]
421 422 if entry[0] == 'r' and entry[2] in (-1, -2):
422 423 source = self._copymap.get(f)
423 424 if entry[2] == -1:
424 425 self.merge(f)
425 426 elif entry[2] == -2:
426 427 self.otherparent(f)
427 428 if source:
428 429 self.copy(source, f)
429 430 return
430 431 if entry[0] == 'm' or entry[0] == 'n' and entry[2] == -2:
431 432 return
432 433 self._addpath(f, 'n', 0, -1, -1)
433 434 if f in self._copymap:
434 435 del self._copymap[f]
435 436
436 437 def otherparent(self, f):
437 438 '''Mark as coming from the other parent, always dirty.'''
438 439 if self._pl[1] == nullid:
439 440 raise util.Abort(_("setting %r to other parent "
440 441 "only allowed in merges") % f)
441 442 if f in self and self[f] == 'n':
442 443 # merge-like
443 444 self._addpath(f, 'm', 0, -2, -1)
444 445 else:
445 446 # add-like
446 447 self._addpath(f, 'n', 0, -2, -1)
447 448
448 449 if f in self._copymap:
449 450 del self._copymap[f]
450 451
451 452 def add(self, f):
452 453 '''Mark a file added.'''
453 454 self._addpath(f, 'a', 0, -1, -1)
454 455 if f in self._copymap:
455 456 del self._copymap[f]
456 457
457 458 def remove(self, f):
458 459 '''Mark a file removed.'''
459 460 self._dirty = True
460 461 self._droppath(f)
461 462 size = 0
462 463 if self._pl[1] != nullid and f in self._map:
463 464 # backup the previous state
464 465 entry = self._map[f]
465 466 if entry[0] == 'm': # merge
466 467 size = -1
467 468 elif entry[0] == 'n' and entry[2] == -2: # other parent
468 469 size = -2
469 470 self._map[f] = dirstatetuple('r', 0, size, 0)
470 471 if size == 0 and f in self._copymap:
471 472 del self._copymap[f]
472 473
473 474 def merge(self, f):
474 475 '''Mark a file merged.'''
475 476 if self._pl[1] == nullid:
476 477 return self.normallookup(f)
477 478 return self.otherparent(f)
478 479
479 480 def drop(self, f):
480 481 '''Drop a file from the dirstate'''
481 482 if f in self._map:
482 483 self._dirty = True
483 484 self._droppath(f)
484 485 del self._map[f]
485 486
486 487 def _discoverpath(self, path, normed, ignoremissing, exists, storemap):
487 488 if exists is None:
488 489 exists = os.path.lexists(os.path.join(self._root, path))
489 490 if not exists:
490 491 # Maybe a path component exists
491 492 if not ignoremissing and '/' in path:
492 493 d, f = path.rsplit('/', 1)
493 494 d = self._normalize(d, False, ignoremissing, None)
494 495 folded = d + "/" + f
495 496 else:
496 497 # No path components, preserve original case
497 498 folded = path
498 499 else:
499 500 # recursively normalize leading directory components
500 501 # against dirstate
501 502 if '/' in normed:
502 503 d, f = normed.rsplit('/', 1)
503 504 d = self._normalize(d, False, ignoremissing, True)
504 505 r = self._root + "/" + d
505 506 folded = d + "/" + util.fspath(f, r)
506 507 else:
507 508 folded = util.fspath(normed, self._root)
508 509 storemap[normed] = folded
509 510
510 511 return folded
511 512
512 513 def _normalizefile(self, path, isknown, ignoremissing=False, exists=None):
513 514 normed = util.normcase(path)
514 515 folded = self._filefoldmap.get(normed, None)
515 516 if folded is None:
516 517 if isknown:
517 518 folded = path
518 519 else:
519 520 folded = self._discoverpath(path, normed, ignoremissing, exists,
520 521 self._filefoldmap)
521 522 return folded
522 523
523 524 def _normalize(self, path, isknown, ignoremissing=False, exists=None):
524 525 normed = util.normcase(path)
525 526 folded = self._filefoldmap.get(normed, None)
526 527 if folded is None:
527 528 folded = self._dirfoldmap.get(normed, None)
528 529 if folded is None:
529 530 if isknown:
530 531 folded = path
531 532 else:
532 533 # store discovered result in dirfoldmap so that future
533 534 # normalizefile calls don't start matching directories
534 535 folded = self._discoverpath(path, normed, ignoremissing, exists,
535 536 self._dirfoldmap)
536 537 return folded
537 538
538 539 def normalize(self, path, isknown=False, ignoremissing=False):
539 540 '''
540 541 normalize the case of a pathname when on a casefolding filesystem
541 542
542 543 isknown specifies whether the filename came from walking the
543 544 disk, to avoid extra filesystem access.
544 545
545 546 If ignoremissing is True, missing path are returned
546 547 unchanged. Otherwise, we try harder to normalize possibly
547 548 existing path components.
548 549
549 550 The normalized case is determined based on the following precedence:
550 551
551 552 - version of name already stored in the dirstate
552 553 - version of name stored on disk
553 554 - version provided via command arguments
554 555 '''
555 556
556 557 if self._checkcase:
557 558 return self._normalize(path, isknown, ignoremissing)
558 559 return path
559 560
560 561 def clear(self):
561 562 self._map = {}
562 563 if "_dirs" in self.__dict__:
563 564 delattr(self, "_dirs")
564 565 self._copymap = {}
565 566 self._pl = [nullid, nullid]
566 567 self._lastnormaltime = 0
567 568 self._dirty = True
568 569
569 570 def rebuild(self, parent, allfiles, changedfiles=None):
570 571 changedfiles = changedfiles or allfiles
571 572 oldmap = self._map
572 573 self.clear()
573 574 for f in allfiles:
574 575 if f not in changedfiles:
575 576 self._map[f] = oldmap[f]
576 577 else:
577 578 if 'x' in allfiles.flags(f):
578 579 self._map[f] = dirstatetuple('n', 0777, -1, 0)
579 580 else:
580 581 self._map[f] = dirstatetuple('n', 0666, -1, 0)
581 582 self._pl = (parent, nullid)
582 583 self._dirty = True
583 584
584 585 def write(self):
585 586 if not self._dirty:
586 587 return
587 588
588 589 # enough 'delaywrite' prevents 'pack_dirstate' from dropping
589 590 # timestamp of each entries in dirstate, because of 'now > mtime'
590 591 delaywrite = self._ui.configint('debug', 'dirstate.delaywrite', 0)
591 592 if delaywrite > 0:
592 593 import time # to avoid useless import
593 594 time.sleep(delaywrite)
594 595
595 st = self._opener("dirstate", "w", atomictemp=True)
596 st = self._opener(self._filename, "w", atomictemp=True)
596 597 # use the modification time of the newly created temporary file as the
597 598 # filesystem's notion of 'now'
598 599 now = util.fstat(st).st_mtime
599 600 st.write(parsers.pack_dirstate(self._map, self._copymap, self._pl, now))
600 601 st.close()
601 602 self._lastnormaltime = 0
602 603 self._dirty = self._dirtypl = False
603 604
604 605 def _dirignore(self, f):
605 606 if f == '.':
606 607 return False
607 608 if self._ignore(f):
608 609 return True
609 610 for p in util.finddirs(f):
610 611 if self._ignore(p):
611 612 return True
612 613 return False
613 614
614 615 def _walkexplicit(self, match, subrepos):
615 616 '''Get stat data about the files explicitly specified by match.
616 617
617 618 Return a triple (results, dirsfound, dirsnotfound).
618 619 - results is a mapping from filename to stat result. It also contains
619 620 listings mapping subrepos and .hg to None.
620 621 - dirsfound is a list of files found to be directories.
621 622 - dirsnotfound is a list of files that the dirstate thinks are
622 623 directories and that were not found.'''
623 624
624 625 def badtype(mode):
625 626 kind = _('unknown')
626 627 if stat.S_ISCHR(mode):
627 628 kind = _('character device')
628 629 elif stat.S_ISBLK(mode):
629 630 kind = _('block device')
630 631 elif stat.S_ISFIFO(mode):
631 632 kind = _('fifo')
632 633 elif stat.S_ISSOCK(mode):
633 634 kind = _('socket')
634 635 elif stat.S_ISDIR(mode):
635 636 kind = _('directory')
636 637 return _('unsupported file type (type is %s)') % kind
637 638
638 639 matchedir = match.explicitdir
639 640 badfn = match.bad
640 641 dmap = self._map
641 642 lstat = os.lstat
642 643 getkind = stat.S_IFMT
643 644 dirkind = stat.S_IFDIR
644 645 regkind = stat.S_IFREG
645 646 lnkkind = stat.S_IFLNK
646 647 join = self._join
647 648 dirsfound = []
648 649 foundadd = dirsfound.append
649 650 dirsnotfound = []
650 651 notfoundadd = dirsnotfound.append
651 652
652 653 if not match.isexact() and self._checkcase:
653 654 normalize = self._normalize
654 655 else:
655 656 normalize = None
656 657
657 658 files = sorted(match.files())
658 659 subrepos.sort()
659 660 i, j = 0, 0
660 661 while i < len(files) and j < len(subrepos):
661 662 subpath = subrepos[j] + "/"
662 663 if files[i] < subpath:
663 664 i += 1
664 665 continue
665 666 while i < len(files) and files[i].startswith(subpath):
666 667 del files[i]
667 668 j += 1
668 669
669 670 if not files or '.' in files:
670 671 files = ['.']
671 672 results = dict.fromkeys(subrepos)
672 673 results['.hg'] = None
673 674
674 675 alldirs = None
675 676 for ff in files:
676 677 # constructing the foldmap is expensive, so don't do it for the
677 678 # common case where files is ['.']
678 679 if normalize and ff != '.':
679 680 nf = normalize(ff, False, True)
680 681 else:
681 682 nf = ff
682 683 if nf in results:
683 684 continue
684 685
685 686 try:
686 687 st = lstat(join(nf))
687 688 kind = getkind(st.st_mode)
688 689 if kind == dirkind:
689 690 if nf in dmap:
690 691 # file replaced by dir on disk but still in dirstate
691 692 results[nf] = None
692 693 if matchedir:
693 694 matchedir(nf)
694 695 foundadd((nf, ff))
695 696 elif kind == regkind or kind == lnkkind:
696 697 results[nf] = st
697 698 else:
698 699 badfn(ff, badtype(kind))
699 700 if nf in dmap:
700 701 results[nf] = None
701 702 except OSError, inst: # nf not found on disk - it is dirstate only
702 703 if nf in dmap: # does it exactly match a missing file?
703 704 results[nf] = None
704 705 else: # does it match a missing directory?
705 706 if alldirs is None:
706 707 alldirs = util.dirs(dmap)
707 708 if nf in alldirs:
708 709 if matchedir:
709 710 matchedir(nf)
710 711 notfoundadd(nf)
711 712 else:
712 713 badfn(ff, inst.strerror)
713 714
714 715 return results, dirsfound, dirsnotfound
715 716
716 717 def walk(self, match, subrepos, unknown, ignored, full=True):
717 718 '''
718 719 Walk recursively through the directory tree, finding all files
719 720 matched by match.
720 721
721 722 If full is False, maybe skip some known-clean files.
722 723
723 724 Return a dict mapping filename to stat-like object (either
724 725 mercurial.osutil.stat instance or return value of os.stat()).
725 726
726 727 '''
727 728 # full is a flag that extensions that hook into walk can use -- this
728 729 # implementation doesn't use it at all. This satisfies the contract
729 730 # because we only guarantee a "maybe".
730 731
731 732 if ignored:
732 733 ignore = util.never
733 734 dirignore = util.never
734 735 elif unknown:
735 736 ignore = self._ignore
736 737 dirignore = self._dirignore
737 738 else:
738 739 # if not unknown and not ignored, drop dir recursion and step 2
739 740 ignore = util.always
740 741 dirignore = util.always
741 742
742 743 matchfn = match.matchfn
743 744 matchalways = match.always()
744 745 matchtdir = match.traversedir
745 746 dmap = self._map
746 747 listdir = osutil.listdir
747 748 lstat = os.lstat
748 749 dirkind = stat.S_IFDIR
749 750 regkind = stat.S_IFREG
750 751 lnkkind = stat.S_IFLNK
751 752 join = self._join
752 753
753 754 exact = skipstep3 = False
754 755 if match.isexact(): # match.exact
755 756 exact = True
756 757 dirignore = util.always # skip step 2
757 758 elif match.files() and not match.anypats(): # match.match, no patterns
758 759 skipstep3 = True
759 760
760 761 if not exact and self._checkcase:
761 762 normalize = self._normalize
762 763 normalizefile = self._normalizefile
763 764 skipstep3 = False
764 765 else:
765 766 normalize = self._normalize
766 767 normalizefile = None
767 768
768 769 # step 1: find all explicit files
769 770 results, work, dirsnotfound = self._walkexplicit(match, subrepos)
770 771
771 772 skipstep3 = skipstep3 and not (work or dirsnotfound)
772 773 work = [d for d in work if not dirignore(d[0])]
773 774
774 775 # step 2: visit subdirectories
775 776 def traverse(work, alreadynormed):
776 777 wadd = work.append
777 778 while work:
778 779 nd = work.pop()
779 780 skip = None
780 781 if nd == '.':
781 782 nd = ''
782 783 else:
783 784 skip = '.hg'
784 785 try:
785 786 entries = listdir(join(nd), stat=True, skip=skip)
786 787 except OSError, inst:
787 788 if inst.errno in (errno.EACCES, errno.ENOENT):
788 789 match.bad(self.pathto(nd), inst.strerror)
789 790 continue
790 791 raise
791 792 for f, kind, st in entries:
792 793 if normalizefile:
793 794 # even though f might be a directory, we're only
794 795 # interested in comparing it to files currently in the
795 796 # dmap -- therefore normalizefile is enough
796 797 nf = normalizefile(nd and (nd + "/" + f) or f, True,
797 798 True)
798 799 else:
799 800 nf = nd and (nd + "/" + f) or f
800 801 if nf not in results:
801 802 if kind == dirkind:
802 803 if not ignore(nf):
803 804 if matchtdir:
804 805 matchtdir(nf)
805 806 wadd(nf)
806 807 if nf in dmap and (matchalways or matchfn(nf)):
807 808 results[nf] = None
808 809 elif kind == regkind or kind == lnkkind:
809 810 if nf in dmap:
810 811 if matchalways or matchfn(nf):
811 812 results[nf] = st
812 813 elif ((matchalways or matchfn(nf))
813 814 and not ignore(nf)):
814 815 # unknown file -- normalize if necessary
815 816 if not alreadynormed:
816 817 nf = normalize(nf, False, True)
817 818 results[nf] = st
818 819 elif nf in dmap and (matchalways or matchfn(nf)):
819 820 results[nf] = None
820 821
821 822 for nd, d in work:
822 823 # alreadynormed means that processwork doesn't have to do any
823 824 # expensive directory normalization
824 825 alreadynormed = not normalize or nd == d
825 826 traverse([d], alreadynormed)
826 827
827 828 for s in subrepos:
828 829 del results[s]
829 830 del results['.hg']
830 831
831 832 # step 3: visit remaining files from dmap
832 833 if not skipstep3 and not exact:
833 834 # If a dmap file is not in results yet, it was either
834 835 # a) not matching matchfn b) ignored, c) missing, or d) under a
835 836 # symlink directory.
836 837 if not results and matchalways:
837 838 visit = dmap.keys()
838 839 else:
839 840 visit = [f for f in dmap if f not in results and matchfn(f)]
840 841 visit.sort()
841 842
842 843 if unknown:
843 844 # unknown == True means we walked all dirs under the roots
844 845 # that wasn't ignored, and everything that matched was stat'ed
845 846 # and is already in results.
846 847 # The rest must thus be ignored or under a symlink.
847 848 audit_path = pathutil.pathauditor(self._root)
848 849
849 850 for nf in iter(visit):
850 851 # If a stat for the same file was already added with a
851 852 # different case, don't add one for this, since that would
852 853 # make it appear as if the file exists under both names
853 854 # on disk.
854 855 if (normalizefile and
855 856 normalizefile(nf, True, True) in results):
856 857 results[nf] = None
857 858 # Report ignored items in the dmap as long as they are not
858 859 # under a symlink directory.
859 860 elif audit_path.check(nf):
860 861 try:
861 862 results[nf] = lstat(join(nf))
862 863 # file was just ignored, no links, and exists
863 864 except OSError:
864 865 # file doesn't exist
865 866 results[nf] = None
866 867 else:
867 868 # It's either missing or under a symlink directory
868 869 # which we in this case report as missing
869 870 results[nf] = None
870 871 else:
871 872 # We may not have walked the full directory tree above,
872 873 # so stat and check everything we missed.
873 874 nf = iter(visit).next
874 875 for st in util.statfiles([join(i) for i in visit]):
875 876 results[nf()] = st
876 877 return results
877 878
878 879 def status(self, match, subrepos, ignored, clean, unknown):
879 880 '''Determine the status of the working copy relative to the
880 881 dirstate and return a pair of (unsure, status), where status is of type
881 882 scmutil.status and:
882 883
883 884 unsure:
884 885 files that might have been modified since the dirstate was
885 886 written, but need to be read to be sure (size is the same
886 887 but mtime differs)
887 888 status.modified:
888 889 files that have definitely been modified since the dirstate
889 890 was written (different size or mode)
890 891 status.clean:
891 892 files that have definitely not been modified since the
892 893 dirstate was written
893 894 '''
894 895 listignored, listclean, listunknown = ignored, clean, unknown
895 896 lookup, modified, added, unknown, ignored = [], [], [], [], []
896 897 removed, deleted, clean = [], [], []
897 898
898 899 dmap = self._map
899 900 ladd = lookup.append # aka "unsure"
900 901 madd = modified.append
901 902 aadd = added.append
902 903 uadd = unknown.append
903 904 iadd = ignored.append
904 905 radd = removed.append
905 906 dadd = deleted.append
906 907 cadd = clean.append
907 908 mexact = match.exact
908 909 dirignore = self._dirignore
909 910 checkexec = self._checkexec
910 911 copymap = self._copymap
911 912 lastnormaltime = self._lastnormaltime
912 913
913 914 # We need to do full walks when either
914 915 # - we're listing all clean files, or
915 916 # - match.traversedir does something, because match.traversedir should
916 917 # be called for every dir in the working dir
917 918 full = listclean or match.traversedir is not None
918 919 for fn, st in self.walk(match, subrepos, listunknown, listignored,
919 920 full=full).iteritems():
920 921 if fn not in dmap:
921 922 if (listignored or mexact(fn)) and dirignore(fn):
922 923 if listignored:
923 924 iadd(fn)
924 925 else:
925 926 uadd(fn)
926 927 continue
927 928
928 929 # This is equivalent to 'state, mode, size, time = dmap[fn]' but not
929 930 # written like that for performance reasons. dmap[fn] is not a
930 931 # Python tuple in compiled builds. The CPython UNPACK_SEQUENCE
931 932 # opcode has fast paths when the value to be unpacked is a tuple or
932 933 # a list, but falls back to creating a full-fledged iterator in
933 934 # general. That is much slower than simply accessing and storing the
934 935 # tuple members one by one.
935 936 t = dmap[fn]
936 937 state = t[0]
937 938 mode = t[1]
938 939 size = t[2]
939 940 time = t[3]
940 941
941 942 if not st and state in "nma":
942 943 dadd(fn)
943 944 elif state == 'n':
944 945 mtime = int(st.st_mtime)
945 946 if (size >= 0 and
946 947 ((size != st.st_size and size != st.st_size & _rangemask)
947 948 or ((mode ^ st.st_mode) & 0100 and checkexec))
948 949 or size == -2 # other parent
949 950 or fn in copymap):
950 951 madd(fn)
951 952 elif time != mtime and time != mtime & _rangemask:
952 953 ladd(fn)
953 954 elif mtime == lastnormaltime:
954 955 # fn may have just been marked as normal and it may have
955 956 # changed in the same second without changing its size.
956 957 # This can happen if we quickly do multiple commits.
957 958 # Force lookup, so we don't miss such a racy file change.
958 959 ladd(fn)
959 960 elif listclean:
960 961 cadd(fn)
961 962 elif state == 'm':
962 963 madd(fn)
963 964 elif state == 'a':
964 965 aadd(fn)
965 966 elif state == 'r':
966 967 radd(fn)
967 968
968 969 return (lookup, scmutil.status(modified, added, removed, deleted,
969 970 unknown, ignored, clean))
970 971
971 972 def matches(self, match):
972 973 '''
973 974 return files in the dirstate (in whatever state) filtered by match
974 975 '''
975 976 dmap = self._map
976 977 if match.always():
977 978 return dmap.keys()
978 979 files = match.files()
979 980 if match.isexact():
980 981 # fast path -- filter the other way around, since typically files is
981 982 # much smaller than dmap
982 983 return [f for f in files if f in dmap]
983 984 if not match.anypats() and all(fn in dmap for fn in files):
984 985 # fast path -- all the values are known to be files, so just return
985 986 # that
986 987 return list(files)
987 988 return [f for f in dmap if match(f)]
General Comments 0
You need to be logged in to leave comments. Login now