##// END OF EJS Templates
changegroupsubset: simplify parents pruning
Benoit Boissinot -
r10010:2fce9691 default
parent child Browse files
Show More
@@ -1,2175 +1,2165
1 1 # localrepo.py - read/write repository class for mercurial
2 2 #
3 3 # Copyright 2005-2007 Matt Mackall <mpm@selenic.com>
4 4 #
5 5 # This software may be used and distributed according to the terms of the
6 6 # GNU General Public License version 2, incorporated herein by reference.
7 7
8 8 from node import bin, hex, nullid, nullrev, short
9 9 from i18n import _
10 10 import repo, changegroup, subrepo
11 11 import changelog, dirstate, filelog, manifest, context
12 12 import lock, transaction, store, encoding
13 13 import util, extensions, hook, error
14 14 import match as match_
15 15 import merge as merge_
16 16 import tags as tags_
17 17 from lock import release
18 18 import weakref, stat, errno, os, time, inspect
19 19 propertycache = util.propertycache
20 20
21 21 class localrepository(repo.repository):
22 22 capabilities = set(('lookup', 'changegroupsubset', 'branchmap'))
23 23 supported = set('revlogv1 store fncache shared'.split())
24 24
25 25 def __init__(self, baseui, path=None, create=0):
26 26 repo.repository.__init__(self)
27 27 self.root = os.path.realpath(path)
28 28 self.path = os.path.join(self.root, ".hg")
29 29 self.origroot = path
30 30 self.opener = util.opener(self.path)
31 31 self.wopener = util.opener(self.root)
32 32 self.baseui = baseui
33 33 self.ui = baseui.copy()
34 34
35 35 try:
36 36 self.ui.readconfig(self.join("hgrc"), self.root)
37 37 extensions.loadall(self.ui)
38 38 except IOError:
39 39 pass
40 40
41 41 if not os.path.isdir(self.path):
42 42 if create:
43 43 if not os.path.exists(path):
44 44 os.mkdir(path)
45 45 os.mkdir(self.path)
46 46 requirements = ["revlogv1"]
47 47 if self.ui.configbool('format', 'usestore', True):
48 48 os.mkdir(os.path.join(self.path, "store"))
49 49 requirements.append("store")
50 50 if self.ui.configbool('format', 'usefncache', True):
51 51 requirements.append("fncache")
52 52 # create an invalid changelog
53 53 self.opener("00changelog.i", "a").write(
54 54 '\0\0\0\2' # represents revlogv2
55 55 ' dummy changelog to prevent using the old repo layout'
56 56 )
57 57 reqfile = self.opener("requires", "w")
58 58 for r in requirements:
59 59 reqfile.write("%s\n" % r)
60 60 reqfile.close()
61 61 else:
62 62 raise error.RepoError(_("repository %s not found") % path)
63 63 elif create:
64 64 raise error.RepoError(_("repository %s already exists") % path)
65 65 else:
66 66 # find requirements
67 67 requirements = set()
68 68 try:
69 69 requirements = set(self.opener("requires").read().splitlines())
70 70 except IOError, inst:
71 71 if inst.errno != errno.ENOENT:
72 72 raise
73 73 for r in requirements - self.supported:
74 74 raise error.RepoError(_("requirement '%s' not supported") % r)
75 75
76 76 self.sharedpath = self.path
77 77 try:
78 78 s = os.path.realpath(self.opener("sharedpath").read())
79 79 if not os.path.exists(s):
80 80 raise error.RepoError(
81 81 _('.hg/sharedpath points to nonexistent directory %s') % s)
82 82 self.sharedpath = s
83 83 except IOError, inst:
84 84 if inst.errno != errno.ENOENT:
85 85 raise
86 86
87 87 self.store = store.store(requirements, self.sharedpath, util.opener)
88 88 self.spath = self.store.path
89 89 self.sopener = self.store.opener
90 90 self.sjoin = self.store.join
91 91 self.opener.createmode = self.store.createmode
92 92
93 93 # These two define the set of tags for this repository. _tags
94 94 # maps tag name to node; _tagtypes maps tag name to 'global' or
95 95 # 'local'. (Global tags are defined by .hgtags across all
96 96 # heads, and local tags are defined in .hg/localtags.) They
97 97 # constitute the in-memory cache of tags.
98 98 self._tags = None
99 99 self._tagtypes = None
100 100
101 101 self._branchcache = None # in UTF-8
102 102 self._branchcachetip = None
103 103 self.nodetagscache = None
104 104 self.filterpats = {}
105 105 self._datafilters = {}
106 106 self._transref = self._lockref = self._wlockref = None
107 107
108 108 @propertycache
109 109 def changelog(self):
110 110 c = changelog.changelog(self.sopener)
111 111 if 'HG_PENDING' in os.environ:
112 112 p = os.environ['HG_PENDING']
113 113 if p.startswith(self.root):
114 114 c.readpending('00changelog.i.a')
115 115 self.sopener.defversion = c.version
116 116 return c
117 117
118 118 @propertycache
119 119 def manifest(self):
120 120 return manifest.manifest(self.sopener)
121 121
122 122 @propertycache
123 123 def dirstate(self):
124 124 return dirstate.dirstate(self.opener, self.ui, self.root)
125 125
126 126 def __getitem__(self, changeid):
127 127 if changeid is None:
128 128 return context.workingctx(self)
129 129 return context.changectx(self, changeid)
130 130
131 131 def __contains__(self, changeid):
132 132 try:
133 133 return bool(self.lookup(changeid))
134 134 except error.RepoLookupError:
135 135 return False
136 136
137 137 def __nonzero__(self):
138 138 return True
139 139
140 140 def __len__(self):
141 141 return len(self.changelog)
142 142
143 143 def __iter__(self):
144 144 for i in xrange(len(self)):
145 145 yield i
146 146
147 147 def url(self):
148 148 return 'file:' + self.root
149 149
150 150 def hook(self, name, throw=False, **args):
151 151 return hook.hook(self.ui, self, name, throw, **args)
152 152
153 153 tag_disallowed = ':\r\n'
154 154
155 155 def _tag(self, names, node, message, local, user, date, extra={}):
156 156 if isinstance(names, str):
157 157 allchars = names
158 158 names = (names,)
159 159 else:
160 160 allchars = ''.join(names)
161 161 for c in self.tag_disallowed:
162 162 if c in allchars:
163 163 raise util.Abort(_('%r cannot be used in a tag name') % c)
164 164
165 165 for name in names:
166 166 self.hook('pretag', throw=True, node=hex(node), tag=name,
167 167 local=local)
168 168
169 169 def writetags(fp, names, munge, prevtags):
170 170 fp.seek(0, 2)
171 171 if prevtags and prevtags[-1] != '\n':
172 172 fp.write('\n')
173 173 for name in names:
174 174 m = munge and munge(name) or name
175 175 if self._tagtypes and name in self._tagtypes:
176 176 old = self._tags.get(name, nullid)
177 177 fp.write('%s %s\n' % (hex(old), m))
178 178 fp.write('%s %s\n' % (hex(node), m))
179 179 fp.close()
180 180
181 181 prevtags = ''
182 182 if local:
183 183 try:
184 184 fp = self.opener('localtags', 'r+')
185 185 except IOError:
186 186 fp = self.opener('localtags', 'a')
187 187 else:
188 188 prevtags = fp.read()
189 189
190 190 # local tags are stored in the current charset
191 191 writetags(fp, names, None, prevtags)
192 192 for name in names:
193 193 self.hook('tag', node=hex(node), tag=name, local=local)
194 194 return
195 195
196 196 try:
197 197 fp = self.wfile('.hgtags', 'rb+')
198 198 except IOError:
199 199 fp = self.wfile('.hgtags', 'ab')
200 200 else:
201 201 prevtags = fp.read()
202 202
203 203 # committed tags are stored in UTF-8
204 204 writetags(fp, names, encoding.fromlocal, prevtags)
205 205
206 206 if '.hgtags' not in self.dirstate:
207 207 self.add(['.hgtags'])
208 208
209 209 m = match_.exact(self.root, '', ['.hgtags'])
210 210 tagnode = self.commit(message, user, date, extra=extra, match=m)
211 211
212 212 for name in names:
213 213 self.hook('tag', node=hex(node), tag=name, local=local)
214 214
215 215 return tagnode
216 216
217 217 def tag(self, names, node, message, local, user, date):
218 218 '''tag a revision with one or more symbolic names.
219 219
220 220 names is a list of strings or, when adding a single tag, names may be a
221 221 string.
222 222
223 223 if local is True, the tags are stored in a per-repository file.
224 224 otherwise, they are stored in the .hgtags file, and a new
225 225 changeset is committed with the change.
226 226
227 227 keyword arguments:
228 228
229 229 local: whether to store tags in non-version-controlled file
230 230 (default False)
231 231
232 232 message: commit message to use if committing
233 233
234 234 user: name of user to use if committing
235 235
236 236 date: date tuple to use if committing'''
237 237
238 238 for x in self.status()[:5]:
239 239 if '.hgtags' in x:
240 240 raise util.Abort(_('working copy of .hgtags is changed '
241 241 '(please commit .hgtags manually)'))
242 242
243 243 self.tags() # instantiate the cache
244 244 self._tag(names, node, message, local, user, date)
245 245
246 246 def tags(self):
247 247 '''return a mapping of tag to node'''
248 248 if self._tags is None:
249 249 (self._tags, self._tagtypes) = self._findtags()
250 250
251 251 return self._tags
252 252
253 253 def _findtags(self):
254 254 '''Do the hard work of finding tags. Return a pair of dicts
255 255 (tags, tagtypes) where tags maps tag name to node, and tagtypes
256 256 maps tag name to a string like \'global\' or \'local\'.
257 257 Subclasses or extensions are free to add their own tags, but
258 258 should be aware that the returned dicts will be retained for the
259 259 duration of the localrepo object.'''
260 260
261 261 # XXX what tagtype should subclasses/extensions use? Currently
262 262 # mq and bookmarks add tags, but do not set the tagtype at all.
263 263 # Should each extension invent its own tag type? Should there
264 264 # be one tagtype for all such "virtual" tags? Or is the status
265 265 # quo fine?
266 266
267 267 alltags = {} # map tag name to (node, hist)
268 268 tagtypes = {}
269 269
270 270 tags_.findglobaltags(self.ui, self, alltags, tagtypes)
271 271 tags_.readlocaltags(self.ui, self, alltags, tagtypes)
272 272
273 273 # Build the return dicts. Have to re-encode tag names because
274 274 # the tags module always uses UTF-8 (in order not to lose info
275 275 # writing to the cache), but the rest of Mercurial wants them in
276 276 # local encoding.
277 277 tags = {}
278 278 for (name, (node, hist)) in alltags.iteritems():
279 279 if node != nullid:
280 280 tags[encoding.tolocal(name)] = node
281 281 tags['tip'] = self.changelog.tip()
282 282 tagtypes = dict([(encoding.tolocal(name), value)
283 283 for (name, value) in tagtypes.iteritems()])
284 284 return (tags, tagtypes)
285 285
286 286 def tagtype(self, tagname):
287 287 '''
288 288 return the type of the given tag. result can be:
289 289
290 290 'local' : a local tag
291 291 'global' : a global tag
292 292 None : tag does not exist
293 293 '''
294 294
295 295 self.tags()
296 296
297 297 return self._tagtypes.get(tagname)
298 298
299 299 def tagslist(self):
300 300 '''return a list of tags ordered by revision'''
301 301 l = []
302 302 for t, n in self.tags().iteritems():
303 303 try:
304 304 r = self.changelog.rev(n)
305 305 except:
306 306 r = -2 # sort to the beginning of the list if unknown
307 307 l.append((r, t, n))
308 308 return [(t, n) for r, t, n in sorted(l)]
309 309
310 310 def nodetags(self, node):
311 311 '''return the tags associated with a node'''
312 312 if not self.nodetagscache:
313 313 self.nodetagscache = {}
314 314 for t, n in self.tags().iteritems():
315 315 self.nodetagscache.setdefault(n, []).append(t)
316 316 return self.nodetagscache.get(node, [])
317 317
318 318 def _branchtags(self, partial, lrev):
319 319 # TODO: rename this function?
320 320 tiprev = len(self) - 1
321 321 if lrev != tiprev:
322 322 self._updatebranchcache(partial, lrev+1, tiprev+1)
323 323 self._writebranchcache(partial, self.changelog.tip(), tiprev)
324 324
325 325 return partial
326 326
327 327 def branchmap(self):
328 328 tip = self.changelog.tip()
329 329 if self._branchcache is not None and self._branchcachetip == tip:
330 330 return self._branchcache
331 331
332 332 oldtip = self._branchcachetip
333 333 self._branchcachetip = tip
334 334 if oldtip is None or oldtip not in self.changelog.nodemap:
335 335 partial, last, lrev = self._readbranchcache()
336 336 else:
337 337 lrev = self.changelog.rev(oldtip)
338 338 partial = self._branchcache
339 339
340 340 self._branchtags(partial, lrev)
341 341 # this private cache holds all heads (not just tips)
342 342 self._branchcache = partial
343 343
344 344 return self._branchcache
345 345
346 346 def branchtags(self):
347 347 '''return a dict where branch names map to the tipmost head of
348 348 the branch, open heads come before closed'''
349 349 bt = {}
350 350 for bn, heads in self.branchmap().iteritems():
351 351 head = None
352 352 for i in range(len(heads)-1, -1, -1):
353 353 h = heads[i]
354 354 if 'close' not in self.changelog.read(h)[5]:
355 355 head = h
356 356 break
357 357 # no open heads were found
358 358 if head is None:
359 359 head = heads[-1]
360 360 bt[bn] = head
361 361 return bt
362 362
363 363
364 364 def _readbranchcache(self):
365 365 partial = {}
366 366 try:
367 367 f = self.opener("branchheads.cache")
368 368 lines = f.read().split('\n')
369 369 f.close()
370 370 except (IOError, OSError):
371 371 return {}, nullid, nullrev
372 372
373 373 try:
374 374 last, lrev = lines.pop(0).split(" ", 1)
375 375 last, lrev = bin(last), int(lrev)
376 376 if lrev >= len(self) or self[lrev].node() != last:
377 377 # invalidate the cache
378 378 raise ValueError('invalidating branch cache (tip differs)')
379 379 for l in lines:
380 380 if not l: continue
381 381 node, label = l.split(" ", 1)
382 382 partial.setdefault(label.strip(), []).append(bin(node))
383 383 except KeyboardInterrupt:
384 384 raise
385 385 except Exception, inst:
386 386 if self.ui.debugflag:
387 387 self.ui.warn(str(inst), '\n')
388 388 partial, last, lrev = {}, nullid, nullrev
389 389 return partial, last, lrev
390 390
391 391 def _writebranchcache(self, branches, tip, tiprev):
392 392 try:
393 393 f = self.opener("branchheads.cache", "w", atomictemp=True)
394 394 f.write("%s %s\n" % (hex(tip), tiprev))
395 395 for label, nodes in branches.iteritems():
396 396 for node in nodes:
397 397 f.write("%s %s\n" % (hex(node), label))
398 398 f.rename()
399 399 except (IOError, OSError):
400 400 pass
401 401
402 402 def _updatebranchcache(self, partial, start, end):
403 403 # collect new branch entries
404 404 newbranches = {}
405 405 for r in xrange(start, end):
406 406 c = self[r]
407 407 newbranches.setdefault(c.branch(), []).append(c.node())
408 408 # if older branchheads are reachable from new ones, they aren't
409 409 # really branchheads. Note checking parents is insufficient:
410 410 # 1 (branch a) -> 2 (branch b) -> 3 (branch a)
411 411 for branch, newnodes in newbranches.iteritems():
412 412 bheads = partial.setdefault(branch, [])
413 413 bheads.extend(newnodes)
414 414 if len(bheads) < 2:
415 415 continue
416 416 newbheads = []
417 417 # starting from tip means fewer passes over reachable
418 418 while newnodes:
419 419 latest = newnodes.pop()
420 420 if latest not in bheads:
421 421 continue
422 422 minbhrev = self[min([self[bh].rev() for bh in bheads])].node()
423 423 reachable = self.changelog.reachable(latest, minbhrev)
424 424 bheads = [b for b in bheads if b not in reachable]
425 425 newbheads.insert(0, latest)
426 426 bheads.extend(newbheads)
427 427 partial[branch] = bheads
428 428
429 429 def lookup(self, key):
430 430 if isinstance(key, int):
431 431 return self.changelog.node(key)
432 432 elif key == '.':
433 433 return self.dirstate.parents()[0]
434 434 elif key == 'null':
435 435 return nullid
436 436 elif key == 'tip':
437 437 return self.changelog.tip()
438 438 n = self.changelog._match(key)
439 439 if n:
440 440 return n
441 441 if key in self.tags():
442 442 return self.tags()[key]
443 443 if key in self.branchtags():
444 444 return self.branchtags()[key]
445 445 n = self.changelog._partialmatch(key)
446 446 if n:
447 447 return n
448 448
449 449 # can't find key, check if it might have come from damaged dirstate
450 450 if key in self.dirstate.parents():
451 451 raise error.Abort(_("working directory has unknown parent '%s'!")
452 452 % short(key))
453 453 try:
454 454 if len(key) == 20:
455 455 key = hex(key)
456 456 except:
457 457 pass
458 458 raise error.RepoLookupError(_("unknown revision '%s'") % key)
459 459
460 460 def local(self):
461 461 return True
462 462
463 463 def join(self, f):
464 464 return os.path.join(self.path, f)
465 465
466 466 def wjoin(self, f):
467 467 return os.path.join(self.root, f)
468 468
469 469 def rjoin(self, f):
470 470 return os.path.join(self.root, util.pconvert(f))
471 471
472 472 def file(self, f):
473 473 if f[0] == '/':
474 474 f = f[1:]
475 475 return filelog.filelog(self.sopener, f)
476 476
477 477 def changectx(self, changeid):
478 478 return self[changeid]
479 479
480 480 def parents(self, changeid=None):
481 481 '''get list of changectxs for parents of changeid'''
482 482 return self[changeid].parents()
483 483
484 484 def filectx(self, path, changeid=None, fileid=None):
485 485 """changeid can be a changeset revision, node, or tag.
486 486 fileid can be a file revision or node."""
487 487 return context.filectx(self, path, changeid, fileid)
488 488
489 489 def getcwd(self):
490 490 return self.dirstate.getcwd()
491 491
492 492 def pathto(self, f, cwd=None):
493 493 return self.dirstate.pathto(f, cwd)
494 494
495 495 def wfile(self, f, mode='r'):
496 496 return self.wopener(f, mode)
497 497
498 498 def _link(self, f):
499 499 return os.path.islink(self.wjoin(f))
500 500
501 501 def _filter(self, filter, filename, data):
502 502 if filter not in self.filterpats:
503 503 l = []
504 504 for pat, cmd in self.ui.configitems(filter):
505 505 if cmd == '!':
506 506 continue
507 507 mf = match_.match(self.root, '', [pat])
508 508 fn = None
509 509 params = cmd
510 510 for name, filterfn in self._datafilters.iteritems():
511 511 if cmd.startswith(name):
512 512 fn = filterfn
513 513 params = cmd[len(name):].lstrip()
514 514 break
515 515 if not fn:
516 516 fn = lambda s, c, **kwargs: util.filter(s, c)
517 517 # Wrap old filters not supporting keyword arguments
518 518 if not inspect.getargspec(fn)[2]:
519 519 oldfn = fn
520 520 fn = lambda s, c, **kwargs: oldfn(s, c)
521 521 l.append((mf, fn, params))
522 522 self.filterpats[filter] = l
523 523
524 524 for mf, fn, cmd in self.filterpats[filter]:
525 525 if mf(filename):
526 526 self.ui.debug("filtering %s through %s\n" % (filename, cmd))
527 527 data = fn(data, cmd, ui=self.ui, repo=self, filename=filename)
528 528 break
529 529
530 530 return data
531 531
532 532 def adddatafilter(self, name, filter):
533 533 self._datafilters[name] = filter
534 534
535 535 def wread(self, filename):
536 536 if self._link(filename):
537 537 data = os.readlink(self.wjoin(filename))
538 538 else:
539 539 data = self.wopener(filename, 'r').read()
540 540 return self._filter("encode", filename, data)
541 541
542 542 def wwrite(self, filename, data, flags):
543 543 data = self._filter("decode", filename, data)
544 544 try:
545 545 os.unlink(self.wjoin(filename))
546 546 except OSError:
547 547 pass
548 548 if 'l' in flags:
549 549 self.wopener.symlink(data, filename)
550 550 else:
551 551 self.wopener(filename, 'w').write(data)
552 552 if 'x' in flags:
553 553 util.set_flags(self.wjoin(filename), False, True)
554 554
555 555 def wwritedata(self, filename, data):
556 556 return self._filter("decode", filename, data)
557 557
558 558 def transaction(self):
559 559 tr = self._transref and self._transref() or None
560 560 if tr and tr.running():
561 561 return tr.nest()
562 562
563 563 # abort here if the journal already exists
564 564 if os.path.exists(self.sjoin("journal")):
565 565 raise error.RepoError(_("abandoned transaction found - run hg recover"))
566 566
567 567 # save dirstate for rollback
568 568 try:
569 569 ds = self.opener("dirstate").read()
570 570 except IOError:
571 571 ds = ""
572 572 self.opener("journal.dirstate", "w").write(ds)
573 573 self.opener("journal.branch", "w").write(self.dirstate.branch())
574 574
575 575 renames = [(self.sjoin("journal"), self.sjoin("undo")),
576 576 (self.join("journal.dirstate"), self.join("undo.dirstate")),
577 577 (self.join("journal.branch"), self.join("undo.branch"))]
578 578 tr = transaction.transaction(self.ui.warn, self.sopener,
579 579 self.sjoin("journal"),
580 580 aftertrans(renames),
581 581 self.store.createmode)
582 582 self._transref = weakref.ref(tr)
583 583 return tr
584 584
585 585 def recover(self):
586 586 lock = self.lock()
587 587 try:
588 588 if os.path.exists(self.sjoin("journal")):
589 589 self.ui.status(_("rolling back interrupted transaction\n"))
590 590 transaction.rollback(self.sopener, self.sjoin("journal"), self.ui.warn)
591 591 self.invalidate()
592 592 return True
593 593 else:
594 594 self.ui.warn(_("no interrupted transaction available\n"))
595 595 return False
596 596 finally:
597 597 lock.release()
598 598
599 599 def rollback(self):
600 600 wlock = lock = None
601 601 try:
602 602 wlock = self.wlock()
603 603 lock = self.lock()
604 604 if os.path.exists(self.sjoin("undo")):
605 605 self.ui.status(_("rolling back last transaction\n"))
606 606 transaction.rollback(self.sopener, self.sjoin("undo"), self.ui.warn)
607 607 util.rename(self.join("undo.dirstate"), self.join("dirstate"))
608 608 try:
609 609 branch = self.opener("undo.branch").read()
610 610 self.dirstate.setbranch(branch)
611 611 except IOError:
612 612 self.ui.warn(_("Named branch could not be reset, "
613 613 "current branch still is: %s\n")
614 614 % encoding.tolocal(self.dirstate.branch()))
615 615 self.invalidate()
616 616 self.dirstate.invalidate()
617 617 self.destroyed()
618 618 else:
619 619 self.ui.warn(_("no rollback information available\n"))
620 620 finally:
621 621 release(lock, wlock)
622 622
623 623 def invalidate(self):
624 624 for a in "changelog manifest".split():
625 625 if a in self.__dict__:
626 626 delattr(self, a)
627 627 self._tags = None
628 628 self._tagtypes = None
629 629 self.nodetagscache = None
630 630 self._branchcache = None # in UTF-8
631 631 self._branchcachetip = None
632 632
633 633 def _lock(self, lockname, wait, releasefn, acquirefn, desc):
634 634 try:
635 635 l = lock.lock(lockname, 0, releasefn, desc=desc)
636 636 except error.LockHeld, inst:
637 637 if not wait:
638 638 raise
639 639 self.ui.warn(_("waiting for lock on %s held by %r\n") %
640 640 (desc, inst.locker))
641 641 # default to 600 seconds timeout
642 642 l = lock.lock(lockname, int(self.ui.config("ui", "timeout", "600")),
643 643 releasefn, desc=desc)
644 644 if acquirefn:
645 645 acquirefn()
646 646 return l
647 647
648 648 def lock(self, wait=True):
649 649 '''Lock the repository store (.hg/store) and return a weak reference
650 650 to the lock. Use this before modifying the store (e.g. committing or
651 651 stripping). If you are opening a transaction, get a lock as well.)'''
652 652 l = self._lockref and self._lockref()
653 653 if l is not None and l.held:
654 654 l.lock()
655 655 return l
656 656
657 657 l = self._lock(self.sjoin("lock"), wait, None, self.invalidate,
658 658 _('repository %s') % self.origroot)
659 659 self._lockref = weakref.ref(l)
660 660 return l
661 661
662 662 def wlock(self, wait=True):
663 663 '''Lock the non-store parts of the repository (everything under
664 664 .hg except .hg/store) and return a weak reference to the lock.
665 665 Use this before modifying files in .hg.'''
666 666 l = self._wlockref and self._wlockref()
667 667 if l is not None and l.held:
668 668 l.lock()
669 669 return l
670 670
671 671 l = self._lock(self.join("wlock"), wait, self.dirstate.write,
672 672 self.dirstate.invalidate, _('working directory of %s') %
673 673 self.origroot)
674 674 self._wlockref = weakref.ref(l)
675 675 return l
676 676
677 677 def _filecommit(self, fctx, manifest1, manifest2, linkrev, tr, changelist):
678 678 """
679 679 commit an individual file as part of a larger transaction
680 680 """
681 681
682 682 fname = fctx.path()
683 683 text = fctx.data()
684 684 flog = self.file(fname)
685 685 fparent1 = manifest1.get(fname, nullid)
686 686 fparent2 = fparent2o = manifest2.get(fname, nullid)
687 687
688 688 meta = {}
689 689 copy = fctx.renamed()
690 690 if copy and copy[0] != fname:
691 691 # Mark the new revision of this file as a copy of another
692 692 # file. This copy data will effectively act as a parent
693 693 # of this new revision. If this is a merge, the first
694 694 # parent will be the nullid (meaning "look up the copy data")
695 695 # and the second one will be the other parent. For example:
696 696 #
697 697 # 0 --- 1 --- 3 rev1 changes file foo
698 698 # \ / rev2 renames foo to bar and changes it
699 699 # \- 2 -/ rev3 should have bar with all changes and
700 700 # should record that bar descends from
701 701 # bar in rev2 and foo in rev1
702 702 #
703 703 # this allows this merge to succeed:
704 704 #
705 705 # 0 --- 1 --- 3 rev4 reverts the content change from rev2
706 706 # \ / merging rev3 and rev4 should use bar@rev2
707 707 # \- 2 --- 4 as the merge base
708 708 #
709 709
710 710 cfname = copy[0]
711 711 crev = manifest1.get(cfname)
712 712 newfparent = fparent2
713 713
714 714 if manifest2: # branch merge
715 715 if fparent2 == nullid or crev is None: # copied on remote side
716 716 if cfname in manifest2:
717 717 crev = manifest2[cfname]
718 718 newfparent = fparent1
719 719
720 720 # find source in nearest ancestor if we've lost track
721 721 if not crev:
722 722 self.ui.debug(" %s: searching for copy revision for %s\n" %
723 723 (fname, cfname))
724 724 for ancestor in self['.'].ancestors():
725 725 if cfname in ancestor:
726 726 crev = ancestor[cfname].filenode()
727 727 break
728 728
729 729 self.ui.debug(" %s: copy %s:%s\n" % (fname, cfname, hex(crev)))
730 730 meta["copy"] = cfname
731 731 meta["copyrev"] = hex(crev)
732 732 fparent1, fparent2 = nullid, newfparent
733 733 elif fparent2 != nullid:
734 734 # is one parent an ancestor of the other?
735 735 fparentancestor = flog.ancestor(fparent1, fparent2)
736 736 if fparentancestor == fparent1:
737 737 fparent1, fparent2 = fparent2, nullid
738 738 elif fparentancestor == fparent2:
739 739 fparent2 = nullid
740 740
741 741 # is the file changed?
742 742 if fparent2 != nullid or flog.cmp(fparent1, text) or meta:
743 743 changelist.append(fname)
744 744 return flog.add(text, meta, tr, linkrev, fparent1, fparent2)
745 745
746 746 # are just the flags changed during merge?
747 747 if fparent1 != fparent2o and manifest1.flags(fname) != fctx.flags():
748 748 changelist.append(fname)
749 749
750 750 return fparent1
751 751
752 752 def commit(self, text="", user=None, date=None, match=None, force=False,
753 753 editor=False, extra={}):
754 754 """Add a new revision to current repository.
755 755
756 756 Revision information is gathered from the working directory,
757 757 match can be used to filter the committed files. If editor is
758 758 supplied, it is called to get a commit message.
759 759 """
760 760
761 761 def fail(f, msg):
762 762 raise util.Abort('%s: %s' % (f, msg))
763 763
764 764 if not match:
765 765 match = match_.always(self.root, '')
766 766
767 767 if not force:
768 768 vdirs = []
769 769 match.dir = vdirs.append
770 770 match.bad = fail
771 771
772 772 wlock = self.wlock()
773 773 try:
774 774 p1, p2 = self.dirstate.parents()
775 775 wctx = self[None]
776 776
777 777 if (not force and p2 != nullid and match and
778 778 (match.files() or match.anypats())):
779 779 raise util.Abort(_('cannot partially commit a merge '
780 780 '(do not specify files or patterns)'))
781 781
782 782 changes = self.status(match=match, clean=force)
783 783 if force:
784 784 changes[0].extend(changes[6]) # mq may commit unchanged files
785 785
786 786 # check subrepos
787 787 subs = []
788 788 for s in wctx.substate:
789 789 if match(s) and wctx.sub(s).dirty():
790 790 subs.append(s)
791 791 if subs and '.hgsubstate' not in changes[0]:
792 792 changes[0].insert(0, '.hgsubstate')
793 793
794 794 # make sure all explicit patterns are matched
795 795 if not force and match.files():
796 796 matched = set(changes[0] + changes[1] + changes[2])
797 797
798 798 for f in match.files():
799 799 if f == '.' or f in matched or f in wctx.substate:
800 800 continue
801 801 if f in changes[3]: # missing
802 802 fail(f, _('file not found!'))
803 803 if f in vdirs: # visited directory
804 804 d = f + '/'
805 805 for mf in matched:
806 806 if mf.startswith(d):
807 807 break
808 808 else:
809 809 fail(f, _("no match under directory!"))
810 810 elif f not in self.dirstate:
811 811 fail(f, _("file not tracked!"))
812 812
813 813 if (not force and not extra.get("close") and p2 == nullid
814 814 and not (changes[0] or changes[1] or changes[2])
815 815 and self[None].branch() == self['.'].branch()):
816 816 return None
817 817
818 818 ms = merge_.mergestate(self)
819 819 for f in changes[0]:
820 820 if f in ms and ms[f] == 'u':
821 821 raise util.Abort(_("unresolved merge conflicts "
822 822 "(see hg resolve)"))
823 823
824 824 cctx = context.workingctx(self, (p1, p2), text, user, date,
825 825 extra, changes)
826 826 if editor:
827 827 cctx._text = editor(self, cctx, subs)
828 828 edited = (text != cctx._text)
829 829
830 830 # commit subs
831 831 if subs:
832 832 state = wctx.substate.copy()
833 833 for s in subs:
834 834 self.ui.status(_('committing subrepository %s\n') % s)
835 835 sr = wctx.sub(s).commit(cctx._text, user, date)
836 836 state[s] = (state[s][0], sr)
837 837 subrepo.writestate(self, state)
838 838
839 839 # Save commit message in case this transaction gets rolled back
840 840 # (e.g. by a pretxncommit hook). Leave the content alone on
841 841 # the assumption that the user will use the same editor again.
842 842 msgfile = self.opener('last-message.txt', 'wb')
843 843 msgfile.write(cctx._text)
844 844 msgfile.close()
845 845
846 846 try:
847 847 ret = self.commitctx(cctx, True)
848 848 except:
849 849 if edited:
850 850 msgfn = self.pathto(msgfile.name[len(self.root)+1:])
851 851 self.ui.write(
852 852 _('note: commit message saved in %s\n') % msgfn)
853 853 raise
854 854
855 855 # update dirstate and mergestate
856 856 for f in changes[0] + changes[1]:
857 857 self.dirstate.normal(f)
858 858 for f in changes[2]:
859 859 self.dirstate.forget(f)
860 860 self.dirstate.setparents(ret)
861 861 ms.reset()
862 862
863 863 return ret
864 864
865 865 finally:
866 866 wlock.release()
867 867
868 868 def commitctx(self, ctx, error=False):
869 869 """Add a new revision to current repository.
870 870
871 871 Revision information is passed via the context argument.
872 872 """
873 873
874 874 tr = lock = None
875 875 removed = ctx.removed()
876 876 p1, p2 = ctx.p1(), ctx.p2()
877 877 m1 = p1.manifest().copy()
878 878 m2 = p2.manifest()
879 879 user = ctx.user()
880 880
881 881 xp1, xp2 = p1.hex(), p2 and p2.hex() or ''
882 882 self.hook("precommit", throw=True, parent1=xp1, parent2=xp2)
883 883
884 884 lock = self.lock()
885 885 try:
886 886 tr = self.transaction()
887 887 trp = weakref.proxy(tr)
888 888
889 889 # check in files
890 890 new = {}
891 891 changed = []
892 892 linkrev = len(self)
893 893 for f in sorted(ctx.modified() + ctx.added()):
894 894 self.ui.note(f + "\n")
895 895 try:
896 896 fctx = ctx[f]
897 897 new[f] = self._filecommit(fctx, m1, m2, linkrev, trp,
898 898 changed)
899 899 m1.set(f, fctx.flags())
900 900 except (OSError, IOError):
901 901 if error:
902 902 self.ui.warn(_("trouble committing %s!\n") % f)
903 903 raise
904 904 else:
905 905 removed.append(f)
906 906
907 907 # update manifest
908 908 m1.update(new)
909 909 removed = [f for f in sorted(removed) if f in m1 or f in m2]
910 910 drop = [f for f in removed if f in m1]
911 911 for f in drop:
912 912 del m1[f]
913 913 mn = self.manifest.add(m1, trp, linkrev, p1.manifestnode(),
914 914 p2.manifestnode(), (new, drop))
915 915
916 916 # update changelog
917 917 self.changelog.delayupdate()
918 918 n = self.changelog.add(mn, changed + removed, ctx.description(),
919 919 trp, p1.node(), p2.node(),
920 920 user, ctx.date(), ctx.extra().copy())
921 921 p = lambda: self.changelog.writepending() and self.root or ""
922 922 self.hook('pretxncommit', throw=True, node=hex(n), parent1=xp1,
923 923 parent2=xp2, pending=p)
924 924 self.changelog.finalize(trp)
925 925 tr.close()
926 926
927 927 if self._branchcache:
928 928 self.branchtags()
929 929
930 930 self.hook("commit", node=hex(n), parent1=xp1, parent2=xp2)
931 931 return n
932 932 finally:
933 933 del tr
934 934 lock.release()
935 935
936 936 def destroyed(self):
937 937 '''Inform the repository that nodes have been destroyed.
938 938 Intended for use by strip and rollback, so there's a common
939 939 place for anything that has to be done after destroying history.'''
940 940 # XXX it might be nice if we could take the list of destroyed
941 941 # nodes, but I don't see an easy way for rollback() to do that
942 942
943 943 # Ensure the persistent tag cache is updated. Doing it now
944 944 # means that the tag cache only has to worry about destroyed
945 945 # heads immediately after a strip/rollback. That in turn
946 946 # guarantees that "cachetip == currenttip" (comparing both rev
947 947 # and node) always means no nodes have been added or destroyed.
948 948
949 949 # XXX this is suboptimal when qrefresh'ing: we strip the current
950 950 # head, refresh the tag cache, then immediately add a new head.
951 951 # But I think doing it this way is necessary for the "instant
952 952 # tag cache retrieval" case to work.
953 953 tags_.findglobaltags(self.ui, self, {}, {})
954 954
955 955 def walk(self, match, node=None):
956 956 '''
957 957 walk recursively through the directory tree or a given
958 958 changeset, finding all files matched by the match
959 959 function
960 960 '''
961 961 return self[node].walk(match)
962 962
963 963 def status(self, node1='.', node2=None, match=None,
964 964 ignored=False, clean=False, unknown=False):
965 965 """return status of files between two nodes or node and working directory
966 966
967 967 If node1 is None, use the first dirstate parent instead.
968 968 If node2 is None, compare node1 with working directory.
969 969 """
970 970
971 971 def mfmatches(ctx):
972 972 mf = ctx.manifest().copy()
973 973 for fn in mf.keys():
974 974 if not match(fn):
975 975 del mf[fn]
976 976 return mf
977 977
978 978 if isinstance(node1, context.changectx):
979 979 ctx1 = node1
980 980 else:
981 981 ctx1 = self[node1]
982 982 if isinstance(node2, context.changectx):
983 983 ctx2 = node2
984 984 else:
985 985 ctx2 = self[node2]
986 986
987 987 working = ctx2.rev() is None
988 988 parentworking = working and ctx1 == self['.']
989 989 match = match or match_.always(self.root, self.getcwd())
990 990 listignored, listclean, listunknown = ignored, clean, unknown
991 991
992 992 # load earliest manifest first for caching reasons
993 993 if not working and ctx2.rev() < ctx1.rev():
994 994 ctx2.manifest()
995 995
996 996 if not parentworking:
997 997 def bad(f, msg):
998 998 if f not in ctx1:
999 999 self.ui.warn('%s: %s\n' % (self.dirstate.pathto(f), msg))
1000 1000 match.bad = bad
1001 1001
1002 1002 if working: # we need to scan the working dir
1003 1003 s = self.dirstate.status(match, listignored, listclean, listunknown)
1004 1004 cmp, modified, added, removed, deleted, unknown, ignored, clean = s
1005 1005
1006 1006 # check for any possibly clean files
1007 1007 if parentworking and cmp:
1008 1008 fixup = []
1009 1009 # do a full compare of any files that might have changed
1010 1010 for f in sorted(cmp):
1011 1011 if (f not in ctx1 or ctx2.flags(f) != ctx1.flags(f)
1012 1012 or ctx1[f].cmp(ctx2[f].data())):
1013 1013 modified.append(f)
1014 1014 else:
1015 1015 fixup.append(f)
1016 1016
1017 1017 if listclean:
1018 1018 clean += fixup
1019 1019
1020 1020 # update dirstate for files that are actually clean
1021 1021 if fixup:
1022 1022 try:
1023 1023 # updating the dirstate is optional
1024 1024 # so we don't wait on the lock
1025 1025 wlock = self.wlock(False)
1026 1026 try:
1027 1027 for f in fixup:
1028 1028 self.dirstate.normal(f)
1029 1029 finally:
1030 1030 wlock.release()
1031 1031 except error.LockError:
1032 1032 pass
1033 1033
1034 1034 if not parentworking:
1035 1035 mf1 = mfmatches(ctx1)
1036 1036 if working:
1037 1037 # we are comparing working dir against non-parent
1038 1038 # generate a pseudo-manifest for the working dir
1039 1039 mf2 = mfmatches(self['.'])
1040 1040 for f in cmp + modified + added:
1041 1041 mf2[f] = None
1042 1042 mf2.set(f, ctx2.flags(f))
1043 1043 for f in removed:
1044 1044 if f in mf2:
1045 1045 del mf2[f]
1046 1046 else:
1047 1047 # we are comparing two revisions
1048 1048 deleted, unknown, ignored = [], [], []
1049 1049 mf2 = mfmatches(ctx2)
1050 1050
1051 1051 modified, added, clean = [], [], []
1052 1052 for fn in mf2:
1053 1053 if fn in mf1:
1054 1054 if (mf1.flags(fn) != mf2.flags(fn) or
1055 1055 (mf1[fn] != mf2[fn] and
1056 1056 (mf2[fn] or ctx1[fn].cmp(ctx2[fn].data())))):
1057 1057 modified.append(fn)
1058 1058 elif listclean:
1059 1059 clean.append(fn)
1060 1060 del mf1[fn]
1061 1061 else:
1062 1062 added.append(fn)
1063 1063 removed = mf1.keys()
1064 1064
1065 1065 r = modified, added, removed, deleted, unknown, ignored, clean
1066 1066 [l.sort() for l in r]
1067 1067 return r
1068 1068
1069 1069 def add(self, list):
1070 1070 wlock = self.wlock()
1071 1071 try:
1072 1072 rejected = []
1073 1073 for f in list:
1074 1074 p = self.wjoin(f)
1075 1075 try:
1076 1076 st = os.lstat(p)
1077 1077 except:
1078 1078 self.ui.warn(_("%s does not exist!\n") % f)
1079 1079 rejected.append(f)
1080 1080 continue
1081 1081 if st.st_size > 10000000:
1082 1082 self.ui.warn(_("%s: files over 10MB may cause memory and"
1083 1083 " performance problems\n"
1084 1084 "(use 'hg revert %s' to unadd the file)\n")
1085 1085 % (f, f))
1086 1086 if not (stat.S_ISREG(st.st_mode) or stat.S_ISLNK(st.st_mode)):
1087 1087 self.ui.warn(_("%s not added: only files and symlinks "
1088 1088 "supported currently\n") % f)
1089 1089 rejected.append(p)
1090 1090 elif self.dirstate[f] in 'amn':
1091 1091 self.ui.warn(_("%s already tracked!\n") % f)
1092 1092 elif self.dirstate[f] == 'r':
1093 1093 self.dirstate.normallookup(f)
1094 1094 else:
1095 1095 self.dirstate.add(f)
1096 1096 return rejected
1097 1097 finally:
1098 1098 wlock.release()
1099 1099
1100 1100 def forget(self, list):
1101 1101 wlock = self.wlock()
1102 1102 try:
1103 1103 for f in list:
1104 1104 if self.dirstate[f] != 'a':
1105 1105 self.ui.warn(_("%s not added!\n") % f)
1106 1106 else:
1107 1107 self.dirstate.forget(f)
1108 1108 finally:
1109 1109 wlock.release()
1110 1110
1111 1111 def remove(self, list, unlink=False):
1112 1112 if unlink:
1113 1113 for f in list:
1114 1114 try:
1115 1115 util.unlink(self.wjoin(f))
1116 1116 except OSError, inst:
1117 1117 if inst.errno != errno.ENOENT:
1118 1118 raise
1119 1119 wlock = self.wlock()
1120 1120 try:
1121 1121 for f in list:
1122 1122 if unlink and os.path.exists(self.wjoin(f)):
1123 1123 self.ui.warn(_("%s still exists!\n") % f)
1124 1124 elif self.dirstate[f] == 'a':
1125 1125 self.dirstate.forget(f)
1126 1126 elif f not in self.dirstate:
1127 1127 self.ui.warn(_("%s not tracked!\n") % f)
1128 1128 else:
1129 1129 self.dirstate.remove(f)
1130 1130 finally:
1131 1131 wlock.release()
1132 1132
1133 1133 def undelete(self, list):
1134 1134 manifests = [self.manifest.read(self.changelog.read(p)[0])
1135 1135 for p in self.dirstate.parents() if p != nullid]
1136 1136 wlock = self.wlock()
1137 1137 try:
1138 1138 for f in list:
1139 1139 if self.dirstate[f] != 'r':
1140 1140 self.ui.warn(_("%s not removed!\n") % f)
1141 1141 else:
1142 1142 m = f in manifests[0] and manifests[0] or manifests[1]
1143 1143 t = self.file(f).read(m[f])
1144 1144 self.wwrite(f, t, m.flags(f))
1145 1145 self.dirstate.normal(f)
1146 1146 finally:
1147 1147 wlock.release()
1148 1148
1149 1149 def copy(self, source, dest):
1150 1150 p = self.wjoin(dest)
1151 1151 if not (os.path.exists(p) or os.path.islink(p)):
1152 1152 self.ui.warn(_("%s does not exist!\n") % dest)
1153 1153 elif not (os.path.isfile(p) or os.path.islink(p)):
1154 1154 self.ui.warn(_("copy failed: %s is not a file or a "
1155 1155 "symbolic link\n") % dest)
1156 1156 else:
1157 1157 wlock = self.wlock()
1158 1158 try:
1159 1159 if self.dirstate[dest] in '?r':
1160 1160 self.dirstate.add(dest)
1161 1161 self.dirstate.copy(source, dest)
1162 1162 finally:
1163 1163 wlock.release()
1164 1164
1165 1165 def heads(self, start=None):
1166 1166 heads = self.changelog.heads(start)
1167 1167 # sort the output in rev descending order
1168 1168 heads = [(-self.changelog.rev(h), h) for h in heads]
1169 1169 return [n for (r, n) in sorted(heads)]
1170 1170
1171 1171 def branchheads(self, branch=None, start=None, closed=False):
1172 1172 '''return a (possibly filtered) list of heads for the given branch
1173 1173
1174 1174 Heads are returned in topological order, from newest to oldest.
1175 1175 If branch is None, use the dirstate branch.
1176 1176 If start is not None, return only heads reachable from start.
1177 1177 If closed is True, return heads that are marked as closed as well.
1178 1178 '''
1179 1179 if branch is None:
1180 1180 branch = self[None].branch()
1181 1181 branches = self.branchmap()
1182 1182 if branch not in branches:
1183 1183 return []
1184 1184 # the cache returns heads ordered lowest to highest
1185 1185 bheads = list(reversed(branches[branch]))
1186 1186 if start is not None:
1187 1187 # filter out the heads that cannot be reached from startrev
1188 1188 fbheads = set(self.changelog.nodesbetween([start], bheads)[2])
1189 1189 bheads = [h for h in bheads if h in fbheads]
1190 1190 if not closed:
1191 1191 bheads = [h for h in bheads if
1192 1192 ('close' not in self.changelog.read(h)[5])]
1193 1193 return bheads
1194 1194
1195 1195 def branches(self, nodes):
1196 1196 if not nodes:
1197 1197 nodes = [self.changelog.tip()]
1198 1198 b = []
1199 1199 for n in nodes:
1200 1200 t = n
1201 1201 while 1:
1202 1202 p = self.changelog.parents(n)
1203 1203 if p[1] != nullid or p[0] == nullid:
1204 1204 b.append((t, n, p[0], p[1]))
1205 1205 break
1206 1206 n = p[0]
1207 1207 return b
1208 1208
1209 1209 def between(self, pairs):
1210 1210 r = []
1211 1211
1212 1212 for top, bottom in pairs:
1213 1213 n, l, i = top, [], 0
1214 1214 f = 1
1215 1215
1216 1216 while n != bottom and n != nullid:
1217 1217 p = self.changelog.parents(n)[0]
1218 1218 if i == f:
1219 1219 l.append(n)
1220 1220 f = f * 2
1221 1221 n = p
1222 1222 i += 1
1223 1223
1224 1224 r.append(l)
1225 1225
1226 1226 return r
1227 1227
1228 1228 def findincoming(self, remote, base=None, heads=None, force=False):
1229 1229 """Return list of roots of the subsets of missing nodes from remote
1230 1230
1231 1231 If base dict is specified, assume that these nodes and their parents
1232 1232 exist on the remote side and that no child of a node of base exists
1233 1233 in both remote and self.
1234 1234 Furthermore base will be updated to include the nodes that exists
1235 1235 in self and remote but no children exists in self and remote.
1236 1236 If a list of heads is specified, return only nodes which are heads
1237 1237 or ancestors of these heads.
1238 1238
1239 1239 All the ancestors of base are in self and in remote.
1240 1240 All the descendants of the list returned are missing in self.
1241 1241 (and so we know that the rest of the nodes are missing in remote, see
1242 1242 outgoing)
1243 1243 """
1244 1244 return self.findcommonincoming(remote, base, heads, force)[1]
1245 1245
1246 1246 def findcommonincoming(self, remote, base=None, heads=None, force=False):
1247 1247 """Return a tuple (common, missing roots, heads) used to identify
1248 1248 missing nodes from remote.
1249 1249
1250 1250 If base dict is specified, assume that these nodes and their parents
1251 1251 exist on the remote side and that no child of a node of base exists
1252 1252 in both remote and self.
1253 1253 Furthermore base will be updated to include the nodes that exists
1254 1254 in self and remote but no children exists in self and remote.
1255 1255 If a list of heads is specified, return only nodes which are heads
1256 1256 or ancestors of these heads.
1257 1257
1258 1258 All the ancestors of base are in self and in remote.
1259 1259 """
1260 1260 m = self.changelog.nodemap
1261 1261 search = []
1262 1262 fetch = set()
1263 1263 seen = set()
1264 1264 seenbranch = set()
1265 1265 if base is None:
1266 1266 base = {}
1267 1267
1268 1268 if not heads:
1269 1269 heads = remote.heads()
1270 1270
1271 1271 if self.changelog.tip() == nullid:
1272 1272 base[nullid] = 1
1273 1273 if heads != [nullid]:
1274 1274 return [nullid], [nullid], list(heads)
1275 1275 return [nullid], [], []
1276 1276
1277 1277 # assume we're closer to the tip than the root
1278 1278 # and start by examining the heads
1279 1279 self.ui.status(_("searching for changes\n"))
1280 1280
1281 1281 unknown = []
1282 1282 for h in heads:
1283 1283 if h not in m:
1284 1284 unknown.append(h)
1285 1285 else:
1286 1286 base[h] = 1
1287 1287
1288 1288 heads = unknown
1289 1289 if not unknown:
1290 1290 return base.keys(), [], []
1291 1291
1292 1292 req = set(unknown)
1293 1293 reqcnt = 0
1294 1294
1295 1295 # search through remote branches
1296 1296 # a 'branch' here is a linear segment of history, with four parts:
1297 1297 # head, root, first parent, second parent
1298 1298 # (a branch always has two parents (or none) by definition)
1299 1299 unknown = remote.branches(unknown)
1300 1300 while unknown:
1301 1301 r = []
1302 1302 while unknown:
1303 1303 n = unknown.pop(0)
1304 1304 if n[0] in seen:
1305 1305 continue
1306 1306
1307 1307 self.ui.debug("examining %s:%s\n"
1308 1308 % (short(n[0]), short(n[1])))
1309 1309 if n[0] == nullid: # found the end of the branch
1310 1310 pass
1311 1311 elif n in seenbranch:
1312 1312 self.ui.debug("branch already found\n")
1313 1313 continue
1314 1314 elif n[1] and n[1] in m: # do we know the base?
1315 1315 self.ui.debug("found incomplete branch %s:%s\n"
1316 1316 % (short(n[0]), short(n[1])))
1317 1317 search.append(n[0:2]) # schedule branch range for scanning
1318 1318 seenbranch.add(n)
1319 1319 else:
1320 1320 if n[1] not in seen and n[1] not in fetch:
1321 1321 if n[2] in m and n[3] in m:
1322 1322 self.ui.debug("found new changeset %s\n" %
1323 1323 short(n[1]))
1324 1324 fetch.add(n[1]) # earliest unknown
1325 1325 for p in n[2:4]:
1326 1326 if p in m:
1327 1327 base[p] = 1 # latest known
1328 1328
1329 1329 for p in n[2:4]:
1330 1330 if p not in req and p not in m:
1331 1331 r.append(p)
1332 1332 req.add(p)
1333 1333 seen.add(n[0])
1334 1334
1335 1335 if r:
1336 1336 reqcnt += 1
1337 1337 self.ui.debug("request %d: %s\n" %
1338 1338 (reqcnt, " ".join(map(short, r))))
1339 1339 for p in xrange(0, len(r), 10):
1340 1340 for b in remote.branches(r[p:p+10]):
1341 1341 self.ui.debug("received %s:%s\n" %
1342 1342 (short(b[0]), short(b[1])))
1343 1343 unknown.append(b)
1344 1344
1345 1345 # do binary search on the branches we found
1346 1346 while search:
1347 1347 newsearch = []
1348 1348 reqcnt += 1
1349 1349 for n, l in zip(search, remote.between(search)):
1350 1350 l.append(n[1])
1351 1351 p = n[0]
1352 1352 f = 1
1353 1353 for i in l:
1354 1354 self.ui.debug("narrowing %d:%d %s\n" % (f, len(l), short(i)))
1355 1355 if i in m:
1356 1356 if f <= 2:
1357 1357 self.ui.debug("found new branch changeset %s\n" %
1358 1358 short(p))
1359 1359 fetch.add(p)
1360 1360 base[i] = 1
1361 1361 else:
1362 1362 self.ui.debug("narrowed branch search to %s:%s\n"
1363 1363 % (short(p), short(i)))
1364 1364 newsearch.append((p, i))
1365 1365 break
1366 1366 p, f = i, f * 2
1367 1367 search = newsearch
1368 1368
1369 1369 # sanity check our fetch list
1370 1370 for f in fetch:
1371 1371 if f in m:
1372 1372 raise error.RepoError(_("already have changeset ")
1373 1373 + short(f[:4]))
1374 1374
1375 1375 if base.keys() == [nullid]:
1376 1376 if force:
1377 1377 self.ui.warn(_("warning: repository is unrelated\n"))
1378 1378 else:
1379 1379 raise util.Abort(_("repository is unrelated"))
1380 1380
1381 1381 self.ui.debug("found new changesets starting at " +
1382 1382 " ".join([short(f) for f in fetch]) + "\n")
1383 1383
1384 1384 self.ui.debug("%d total queries\n" % reqcnt)
1385 1385
1386 1386 return base.keys(), list(fetch), heads
1387 1387
1388 1388 def findoutgoing(self, remote, base=None, heads=None, force=False):
1389 1389 """Return list of nodes that are roots of subsets not in remote
1390 1390
1391 1391 If base dict is specified, assume that these nodes and their parents
1392 1392 exist on the remote side.
1393 1393 If a list of heads is specified, return only nodes which are heads
1394 1394 or ancestors of these heads, and return a second element which
1395 1395 contains all remote heads which get new children.
1396 1396 """
1397 1397 if base is None:
1398 1398 base = {}
1399 1399 self.findincoming(remote, base, heads, force=force)
1400 1400
1401 1401 self.ui.debug("common changesets up to "
1402 1402 + " ".join(map(short, base.keys())) + "\n")
1403 1403
1404 1404 remain = set(self.changelog.nodemap)
1405 1405
1406 1406 # prune everything remote has from the tree
1407 1407 remain.remove(nullid)
1408 1408 remove = base.keys()
1409 1409 while remove:
1410 1410 n = remove.pop(0)
1411 1411 if n in remain:
1412 1412 remain.remove(n)
1413 1413 for p in self.changelog.parents(n):
1414 1414 remove.append(p)
1415 1415
1416 1416 # find every node whose parents have been pruned
1417 1417 subset = []
1418 1418 # find every remote head that will get new children
1419 1419 updated_heads = set()
1420 1420 for n in remain:
1421 1421 p1, p2 = self.changelog.parents(n)
1422 1422 if p1 not in remain and p2 not in remain:
1423 1423 subset.append(n)
1424 1424 if heads:
1425 1425 if p1 in heads:
1426 1426 updated_heads.add(p1)
1427 1427 if p2 in heads:
1428 1428 updated_heads.add(p2)
1429 1429
1430 1430 # this is the set of all roots we have to push
1431 1431 if heads:
1432 1432 return subset, list(updated_heads)
1433 1433 else:
1434 1434 return subset
1435 1435
1436 1436 def pull(self, remote, heads=None, force=False):
1437 1437 lock = self.lock()
1438 1438 try:
1439 1439 common, fetch, rheads = self.findcommonincoming(remote, heads=heads,
1440 1440 force=force)
1441 1441 if fetch == [nullid]:
1442 1442 self.ui.status(_("requesting all changes\n"))
1443 1443
1444 1444 if not fetch:
1445 1445 self.ui.status(_("no changes found\n"))
1446 1446 return 0
1447 1447
1448 1448 if heads is None and remote.capable('changegroupsubset'):
1449 1449 heads = rheads
1450 1450
1451 1451 if heads is None:
1452 1452 cg = remote.changegroup(fetch, 'pull')
1453 1453 else:
1454 1454 if not remote.capable('changegroupsubset'):
1455 1455 raise util.Abort(_("Partial pull cannot be done because "
1456 1456 "other repository doesn't support "
1457 1457 "changegroupsubset."))
1458 1458 cg = remote.changegroupsubset(fetch, heads, 'pull')
1459 1459 return self.addchangegroup(cg, 'pull', remote.url())
1460 1460 finally:
1461 1461 lock.release()
1462 1462
1463 1463 def push(self, remote, force=False, revs=None):
1464 1464 # there are two ways to push to remote repo:
1465 1465 #
1466 1466 # addchangegroup assumes local user can lock remote
1467 1467 # repo (local filesystem, old ssh servers).
1468 1468 #
1469 1469 # unbundle assumes local user cannot lock remote repo (new ssh
1470 1470 # servers, http servers).
1471 1471
1472 1472 if remote.capable('unbundle'):
1473 1473 return self.push_unbundle(remote, force, revs)
1474 1474 return self.push_addchangegroup(remote, force, revs)
1475 1475
1476 1476 def prepush(self, remote, force, revs):
1477 1477 '''Analyze the local and remote repositories and determine which
1478 1478 changesets need to be pushed to the remote. Return a tuple
1479 1479 (changegroup, remoteheads). changegroup is a readable file-like
1480 1480 object whose read() returns successive changegroup chunks ready to
1481 1481 be sent over the wire. remoteheads is the list of remote heads.
1482 1482 '''
1483 1483 common = {}
1484 1484 remote_heads = remote.heads()
1485 1485 inc = self.findincoming(remote, common, remote_heads, force=force)
1486 1486
1487 1487 update, updated_heads = self.findoutgoing(remote, common, remote_heads)
1488 1488 msng_cl, bases, heads = self.changelog.nodesbetween(update, revs)
1489 1489
1490 1490 def checkbranch(lheads, rheads, updatelb):
1491 1491 '''
1492 1492 check whether there are more local heads than remote heads on
1493 1493 a specific branch.
1494 1494
1495 1495 lheads: local branch heads
1496 1496 rheads: remote branch heads
1497 1497 updatelb: outgoing local branch bases
1498 1498 '''
1499 1499
1500 1500 warn = 0
1501 1501
1502 1502 if not revs and len(lheads) > len(rheads):
1503 1503 warn = 1
1504 1504 else:
1505 1505 # add local heads involved in the push
1506 1506 updatelheads = [self.changelog.heads(x, lheads)
1507 1507 for x in updatelb]
1508 1508 newheads = set(sum(updatelheads, [])) & set(lheads)
1509 1509
1510 1510 if not newheads:
1511 1511 return True
1512 1512
1513 1513 # add heads we don't have or that are not involved in the push
1514 1514 for r in rheads:
1515 1515 if r in self.changelog.nodemap:
1516 1516 desc = self.changelog.heads(r, heads)
1517 1517 l = [h for h in heads if h in desc]
1518 1518 if not l:
1519 1519 newheads.add(r)
1520 1520 else:
1521 1521 newheads.add(r)
1522 1522 if len(newheads) > len(rheads):
1523 1523 warn = 1
1524 1524
1525 1525 if warn:
1526 1526 if not rheads: # new branch requires --force
1527 1527 self.ui.warn(_("abort: push creates new"
1528 1528 " remote branch '%s'!\n") %
1529 1529 self[lheads[0]].branch())
1530 1530 else:
1531 1531 self.ui.warn(_("abort: push creates new remote heads!\n"))
1532 1532
1533 1533 self.ui.status(_("(did you forget to merge?"
1534 1534 " use push -f to force)\n"))
1535 1535 return False
1536 1536 return True
1537 1537
1538 1538 if not bases:
1539 1539 self.ui.status(_("no changes found\n"))
1540 1540 return None, 1
1541 1541 elif not force:
1542 1542 # Check for each named branch if we're creating new remote heads.
1543 1543 # To be a remote head after push, node must be either:
1544 1544 # - unknown locally
1545 1545 # - a local outgoing head descended from update
1546 1546 # - a remote head that's known locally and not
1547 1547 # ancestral to an outgoing head
1548 1548 #
1549 1549 # New named branches cannot be created without --force.
1550 1550
1551 1551 if remote_heads != [nullid]:
1552 1552 if remote.capable('branchmap'):
1553 1553 localhds = {}
1554 1554 if not revs:
1555 1555 localhds = self.branchmap()
1556 1556 else:
1557 1557 for n in heads:
1558 1558 branch = self[n].branch()
1559 1559 if branch in localhds:
1560 1560 localhds[branch].append(n)
1561 1561 else:
1562 1562 localhds[branch] = [n]
1563 1563
1564 1564 remotehds = remote.branchmap()
1565 1565
1566 1566 for lh in localhds:
1567 1567 if lh in remotehds:
1568 1568 rheads = remotehds[lh]
1569 1569 else:
1570 1570 rheads = []
1571 1571 lheads = localhds[lh]
1572 1572 if not checkbranch(lheads, rheads, update):
1573 1573 return None, 0
1574 1574 else:
1575 1575 if not checkbranch(heads, remote_heads, update):
1576 1576 return None, 0
1577 1577
1578 1578 if inc:
1579 1579 self.ui.warn(_("note: unsynced remote changes!\n"))
1580 1580
1581 1581
1582 1582 if revs is None:
1583 1583 # use the fast path, no race possible on push
1584 1584 nodes = self.changelog.findmissing(common.keys())
1585 1585 cg = self._changegroup(nodes, 'push')
1586 1586 else:
1587 1587 cg = self.changegroupsubset(update, revs, 'push')
1588 1588 return cg, remote_heads
1589 1589
1590 1590 def push_addchangegroup(self, remote, force, revs):
1591 1591 lock = remote.lock()
1592 1592 try:
1593 1593 ret = self.prepush(remote, force, revs)
1594 1594 if ret[0] is not None:
1595 1595 cg, remote_heads = ret
1596 1596 return remote.addchangegroup(cg, 'push', self.url())
1597 1597 return ret[1]
1598 1598 finally:
1599 1599 lock.release()
1600 1600
1601 1601 def push_unbundle(self, remote, force, revs):
1602 1602 # local repo finds heads on server, finds out what revs it
1603 1603 # must push. once revs transferred, if server finds it has
1604 1604 # different heads (someone else won commit/push race), server
1605 1605 # aborts.
1606 1606
1607 1607 ret = self.prepush(remote, force, revs)
1608 1608 if ret[0] is not None:
1609 1609 cg, remote_heads = ret
1610 1610 if force: remote_heads = ['force']
1611 1611 return remote.unbundle(cg, remote_heads, 'push')
1612 1612 return ret[1]
1613 1613
1614 1614 def changegroupinfo(self, nodes, source):
1615 1615 if self.ui.verbose or source == 'bundle':
1616 1616 self.ui.status(_("%d changesets found\n") % len(nodes))
1617 1617 if self.ui.debugflag:
1618 1618 self.ui.debug("list of changesets:\n")
1619 1619 for node in nodes:
1620 1620 self.ui.debug("%s\n" % hex(node))
1621 1621
1622 1622 def changegroupsubset(self, bases, heads, source, extranodes=None):
1623 1623 """Compute a changegroup consisting of all the nodes that are
1624 1624 descendents of any of the bases and ancestors of any of the heads.
1625 1625 Return a chunkbuffer object whose read() method will return
1626 1626 successive changegroup chunks.
1627 1627
1628 1628 It is fairly complex as determining which filenodes and which
1629 1629 manifest nodes need to be included for the changeset to be complete
1630 1630 is non-trivial.
1631 1631
1632 1632 Another wrinkle is doing the reverse, figuring out which changeset in
1633 1633 the changegroup a particular filenode or manifestnode belongs to.
1634 1634
1635 1635 The caller can specify some nodes that must be included in the
1636 1636 changegroup using the extranodes argument. It should be a dict
1637 1637 where the keys are the filenames (or 1 for the manifest), and the
1638 1638 values are lists of (node, linknode) tuples, where node is a wanted
1639 1639 node and linknode is the changelog node that should be transmitted as
1640 1640 the linkrev.
1641 1641 """
1642 1642
1643 1643 # Set up some initial variables
1644 1644 # Make it easy to refer to self.changelog
1645 1645 cl = self.changelog
1646 1646 # msng is short for missing - compute the list of changesets in this
1647 1647 # changegroup.
1648 1648 if not bases:
1649 1649 bases = [nullid]
1650 1650 msng_cl_lst, bases, heads = cl.nodesbetween(bases, heads)
1651 1651
1652 1652 if extranodes is None:
1653 1653 # can we go through the fast path ?
1654 1654 heads.sort()
1655 1655 allheads = self.heads()
1656 1656 allheads.sort()
1657 1657 if heads == allheads:
1658 1658 return self._changegroup(msng_cl_lst, source)
1659 1659
1660 1660 # slow path
1661 1661 self.hook('preoutgoing', throw=True, source=source)
1662 1662
1663 1663 self.changegroupinfo(msng_cl_lst, source)
1664 1664 # Some bases may turn out to be superfluous, and some heads may be
1665 1665 # too. nodesbetween will return the minimal set of bases and heads
1666 1666 # necessary to re-create the changegroup.
1667 1667
1668 1668 # Known heads are the list of heads that it is assumed the recipient
1669 1669 # of this changegroup will know about.
1670 1670 knownheads = set()
1671 1671 # We assume that all parents of bases are known heads.
1672 1672 for n in bases:
1673 1673 knownheads.update(cl.parents(n))
1674 1674 knownheads.discard(nullid)
1675 1675 knownheads = list(knownheads)
1676 1676 if knownheads:
1677 1677 # Now that we know what heads are known, we can compute which
1678 1678 # changesets are known. The recipient must know about all
1679 1679 # changesets required to reach the known heads from the null
1680 1680 # changeset.
1681 1681 has_cl_set, junk, junk = cl.nodesbetween(None, knownheads)
1682 1682 junk = None
1683 1683 # Transform the list into a set.
1684 1684 has_cl_set = set(has_cl_set)
1685 1685 else:
1686 1686 # If there were no known heads, the recipient cannot be assumed to
1687 1687 # know about any changesets.
1688 1688 has_cl_set = set()
1689 1689
1690 1690 # Make it easy to refer to self.manifest
1691 1691 mnfst = self.manifest
1692 1692 # We don't know which manifests are missing yet
1693 1693 msng_mnfst_set = {}
1694 1694 # Nor do we know which filenodes are missing.
1695 1695 msng_filenode_set = {}
1696 1696
1697 1697 junk = mnfst.index[len(mnfst) - 1] # Get around a bug in lazyindex
1698 1698 junk = None
1699 1699
1700 1700 # A changeset always belongs to itself, so the changenode lookup
1701 1701 # function for a changenode is identity.
1702 1702 def identity(x):
1703 1703 return x
1704 1704
1705 1705 # If we determine that a particular file or manifest node must be a
1706 1706 # node that the recipient of the changegroup will already have, we can
1707 1707 # also assume the recipient will have all the parents. This function
1708 1708 # prunes them from the set of missing nodes.
1709 1709 def prune_parents(revlog, hasset, msngset):
1710 haslst = list(hasset)
1711 haslst.sort(key=revlog.rev)
1712 for node in haslst:
1713 parentlst = [p for p in revlog.parents(node) if p != nullid]
1714 while parentlst:
1715 n = parentlst.pop()
1716 if n not in hasset:
1717 hasset.add(n)
1718 p = [p for p in revlog.parents(n) if p != nullid]
1719 parentlst.extend(p)
1720 for n in hasset:
1721 msngset.pop(n, None)
1710 for r in revlog.ancestors(*[revlog.rev(n) for n in hasset]):
1711 msngset.pop(revlog.node(r), None)
1722 1712
1723 1713 # This is a function generating function used to set up an environment
1724 1714 # for the inner function to execute in.
1725 1715 def manifest_and_file_collector(changedfileset):
1726 1716 # This is an information gathering function that gathers
1727 1717 # information from each changeset node that goes out as part of
1728 1718 # the changegroup. The information gathered is a list of which
1729 1719 # manifest nodes are potentially required (the recipient may
1730 1720 # already have them) and total list of all files which were
1731 1721 # changed in any changeset in the changegroup.
1732 1722 #
1733 1723 # We also remember the first changenode we saw any manifest
1734 1724 # referenced by so we can later determine which changenode 'owns'
1735 1725 # the manifest.
1736 1726 def collect_manifests_and_files(clnode):
1737 1727 c = cl.read(clnode)
1738 1728 for f in c[3]:
1739 1729 # This is to make sure we only have one instance of each
1740 1730 # filename string for each filename.
1741 1731 changedfileset.setdefault(f, f)
1742 1732 msng_mnfst_set.setdefault(c[0], clnode)
1743 1733 return collect_manifests_and_files
1744 1734
1745 1735 # Figure out which manifest nodes (of the ones we think might be part
1746 1736 # of the changegroup) the recipient must know about and remove them
1747 1737 # from the changegroup.
1748 1738 def prune_manifests():
1749 1739 has_mnfst_set = set()
1750 1740 for n in msng_mnfst_set:
1751 1741 # If a 'missing' manifest thinks it belongs to a changenode
1752 1742 # the recipient is assumed to have, obviously the recipient
1753 1743 # must have that manifest.
1754 1744 linknode = cl.node(mnfst.linkrev(mnfst.rev(n)))
1755 1745 if linknode in has_cl_set:
1756 1746 has_mnfst_set.add(n)
1757 1747 prune_parents(mnfst, has_mnfst_set, msng_mnfst_set)
1758 1748
1759 1749 # Use the information collected in collect_manifests_and_files to say
1760 1750 # which changenode any manifestnode belongs to.
1761 1751 def lookup_manifest_link(mnfstnode):
1762 1752 return msng_mnfst_set[mnfstnode]
1763 1753
1764 1754 # A function generating function that sets up the initial environment
1765 1755 # the inner function.
1766 1756 def filenode_collector(changedfiles):
1767 1757 next_rev = [0]
1768 1758 # This gathers information from each manifestnode included in the
1769 1759 # changegroup about which filenodes the manifest node references
1770 1760 # so we can include those in the changegroup too.
1771 1761 #
1772 1762 # It also remembers which changenode each filenode belongs to. It
1773 1763 # does this by assuming the a filenode belongs to the changenode
1774 1764 # the first manifest that references it belongs to.
1775 1765 def collect_msng_filenodes(mnfstnode):
1776 1766 r = mnfst.rev(mnfstnode)
1777 1767 if r == next_rev[0]:
1778 1768 # If the last rev we looked at was the one just previous,
1779 1769 # we only need to see a diff.
1780 1770 deltamf = mnfst.readdelta(mnfstnode)
1781 1771 # For each line in the delta
1782 1772 for f, fnode in deltamf.iteritems():
1783 1773 f = changedfiles.get(f, None)
1784 1774 # And if the file is in the list of files we care
1785 1775 # about.
1786 1776 if f is not None:
1787 1777 # Get the changenode this manifest belongs to
1788 1778 clnode = msng_mnfst_set[mnfstnode]
1789 1779 # Create the set of filenodes for the file if
1790 1780 # there isn't one already.
1791 1781 ndset = msng_filenode_set.setdefault(f, {})
1792 1782 # And set the filenode's changelog node to the
1793 1783 # manifest's if it hasn't been set already.
1794 1784 ndset.setdefault(fnode, clnode)
1795 1785 else:
1796 1786 # Otherwise we need a full manifest.
1797 1787 m = mnfst.read(mnfstnode)
1798 1788 # For every file in we care about.
1799 1789 for f in changedfiles:
1800 1790 fnode = m.get(f, None)
1801 1791 # If it's in the manifest
1802 1792 if fnode is not None:
1803 1793 # See comments above.
1804 1794 clnode = msng_mnfst_set[mnfstnode]
1805 1795 ndset = msng_filenode_set.setdefault(f, {})
1806 1796 ndset.setdefault(fnode, clnode)
1807 1797 # Remember the revision we hope to see next.
1808 1798 next_rev[0] = r + 1
1809 1799 return collect_msng_filenodes
1810 1800
1811 1801 # We have a list of filenodes we think we need for a file, lets remove
1812 1802 # all those we know the recipient must have.
1813 1803 def prune_filenodes(f, filerevlog):
1814 1804 msngset = msng_filenode_set[f]
1815 1805 hasset = set()
1816 1806 # If a 'missing' filenode thinks it belongs to a changenode we
1817 1807 # assume the recipient must have, then the recipient must have
1818 1808 # that filenode.
1819 1809 for n in msngset:
1820 1810 clnode = cl.node(filerevlog.linkrev(filerevlog.rev(n)))
1821 1811 if clnode in has_cl_set:
1822 1812 hasset.add(n)
1823 1813 prune_parents(filerevlog, hasset, msngset)
1824 1814
1825 1815 # A function generator function that sets up the a context for the
1826 1816 # inner function.
1827 1817 def lookup_filenode_link_func(fname):
1828 1818 msngset = msng_filenode_set[fname]
1829 1819 # Lookup the changenode the filenode belongs to.
1830 1820 def lookup_filenode_link(fnode):
1831 1821 return msngset[fnode]
1832 1822 return lookup_filenode_link
1833 1823
1834 1824 # Add the nodes that were explicitly requested.
1835 1825 def add_extra_nodes(name, nodes):
1836 1826 if not extranodes or name not in extranodes:
1837 1827 return
1838 1828
1839 1829 for node, linknode in extranodes[name]:
1840 1830 if node not in nodes:
1841 1831 nodes[node] = linknode
1842 1832
1843 1833 # Now that we have all theses utility functions to help out and
1844 1834 # logically divide up the task, generate the group.
1845 1835 def gengroup():
1846 1836 # The set of changed files starts empty.
1847 1837 changedfiles = {}
1848 1838 # Create a changenode group generator that will call our functions
1849 1839 # back to lookup the owning changenode and collect information.
1850 1840 group = cl.group(msng_cl_lst, identity,
1851 1841 manifest_and_file_collector(changedfiles))
1852 1842 for chnk in group:
1853 1843 yield chnk
1854 1844
1855 1845 # The list of manifests has been collected by the generator
1856 1846 # calling our functions back.
1857 1847 prune_manifests()
1858 1848 add_extra_nodes(1, msng_mnfst_set)
1859 1849 msng_mnfst_lst = msng_mnfst_set.keys()
1860 1850 # Sort the manifestnodes by revision number.
1861 1851 msng_mnfst_lst.sort(key=mnfst.rev)
1862 1852 # Create a generator for the manifestnodes that calls our lookup
1863 1853 # and data collection functions back.
1864 1854 group = mnfst.group(msng_mnfst_lst, lookup_manifest_link,
1865 1855 filenode_collector(changedfiles))
1866 1856 for chnk in group:
1867 1857 yield chnk
1868 1858
1869 1859 # These are no longer needed, dereference and toss the memory for
1870 1860 # them.
1871 1861 msng_mnfst_lst = None
1872 1862 msng_mnfst_set.clear()
1873 1863
1874 1864 if extranodes:
1875 1865 for fname in extranodes:
1876 1866 if isinstance(fname, int):
1877 1867 continue
1878 1868 msng_filenode_set.setdefault(fname, {})
1879 1869 changedfiles[fname] = 1
1880 1870 # Go through all our files in order sorted by name.
1881 1871 for fname in sorted(changedfiles):
1882 1872 filerevlog = self.file(fname)
1883 1873 if not len(filerevlog):
1884 1874 raise util.Abort(_("empty or missing revlog for %s") % fname)
1885 1875 # Toss out the filenodes that the recipient isn't really
1886 1876 # missing.
1887 1877 if fname in msng_filenode_set:
1888 1878 prune_filenodes(fname, filerevlog)
1889 1879 add_extra_nodes(fname, msng_filenode_set[fname])
1890 1880 msng_filenode_lst = msng_filenode_set[fname].keys()
1891 1881 else:
1892 1882 msng_filenode_lst = []
1893 1883 # If any filenodes are left, generate the group for them,
1894 1884 # otherwise don't bother.
1895 1885 if len(msng_filenode_lst) > 0:
1896 1886 yield changegroup.chunkheader(len(fname))
1897 1887 yield fname
1898 1888 # Sort the filenodes by their revision #
1899 1889 msng_filenode_lst.sort(key=filerevlog.rev)
1900 1890 # Create a group generator and only pass in a changenode
1901 1891 # lookup function as we need to collect no information
1902 1892 # from filenodes.
1903 1893 group = filerevlog.group(msng_filenode_lst,
1904 1894 lookup_filenode_link_func(fname))
1905 1895 for chnk in group:
1906 1896 yield chnk
1907 1897 if fname in msng_filenode_set:
1908 1898 # Don't need this anymore, toss it to free memory.
1909 1899 del msng_filenode_set[fname]
1910 1900 # Signal that no more groups are left.
1911 1901 yield changegroup.closechunk()
1912 1902
1913 1903 if msng_cl_lst:
1914 1904 self.hook('outgoing', node=hex(msng_cl_lst[0]), source=source)
1915 1905
1916 1906 return util.chunkbuffer(gengroup())
1917 1907
1918 1908 def changegroup(self, basenodes, source):
1919 1909 # to avoid a race we use changegroupsubset() (issue1320)
1920 1910 return self.changegroupsubset(basenodes, self.heads(), source)
1921 1911
1922 1912 def _changegroup(self, nodes, source):
1923 1913 """Compute the changegroup of all nodes that we have that a recipient
1924 1914 doesn't. Return a chunkbuffer object whose read() method will return
1925 1915 successive changegroup chunks.
1926 1916
1927 1917 This is much easier than the previous function as we can assume that
1928 1918 the recipient has any changenode we aren't sending them.
1929 1919
1930 1920 nodes is the set of nodes to send"""
1931 1921
1932 1922 self.hook('preoutgoing', throw=True, source=source)
1933 1923
1934 1924 cl = self.changelog
1935 1925 revset = set([cl.rev(n) for n in nodes])
1936 1926 self.changegroupinfo(nodes, source)
1937 1927
1938 1928 def identity(x):
1939 1929 return x
1940 1930
1941 1931 def gennodelst(log):
1942 1932 for r in log:
1943 1933 if log.linkrev(r) in revset:
1944 1934 yield log.node(r)
1945 1935
1946 1936 def changed_file_collector(changedfileset):
1947 1937 def collect_changed_files(clnode):
1948 1938 c = cl.read(clnode)
1949 1939 changedfileset.update(c[3])
1950 1940 return collect_changed_files
1951 1941
1952 1942 def lookuprevlink_func(revlog):
1953 1943 def lookuprevlink(n):
1954 1944 return cl.node(revlog.linkrev(revlog.rev(n)))
1955 1945 return lookuprevlink
1956 1946
1957 1947 def gengroup():
1958 1948 '''yield a sequence of changegroup chunks (strings)'''
1959 1949 # construct a list of all changed files
1960 1950 changedfiles = set()
1961 1951
1962 1952 for chnk in cl.group(nodes, identity,
1963 1953 changed_file_collector(changedfiles)):
1964 1954 yield chnk
1965 1955
1966 1956 mnfst = self.manifest
1967 1957 nodeiter = gennodelst(mnfst)
1968 1958 for chnk in mnfst.group(nodeiter, lookuprevlink_func(mnfst)):
1969 1959 yield chnk
1970 1960
1971 1961 for fname in sorted(changedfiles):
1972 1962 filerevlog = self.file(fname)
1973 1963 if not len(filerevlog):
1974 1964 raise util.Abort(_("empty or missing revlog for %s") % fname)
1975 1965 nodeiter = gennodelst(filerevlog)
1976 1966 nodeiter = list(nodeiter)
1977 1967 if nodeiter:
1978 1968 yield changegroup.chunkheader(len(fname))
1979 1969 yield fname
1980 1970 lookup = lookuprevlink_func(filerevlog)
1981 1971 for chnk in filerevlog.group(nodeiter, lookup):
1982 1972 yield chnk
1983 1973
1984 1974 yield changegroup.closechunk()
1985 1975
1986 1976 if nodes:
1987 1977 self.hook('outgoing', node=hex(nodes[0]), source=source)
1988 1978
1989 1979 return util.chunkbuffer(gengroup())
1990 1980
1991 1981 def addchangegroup(self, source, srctype, url, emptyok=False):
1992 1982 """add changegroup to repo.
1993 1983
1994 1984 return values:
1995 1985 - nothing changed or no source: 0
1996 1986 - more heads than before: 1+added heads (2..n)
1997 1987 - less heads than before: -1-removed heads (-2..-n)
1998 1988 - number of heads stays the same: 1
1999 1989 """
2000 1990 def csmap(x):
2001 1991 self.ui.debug("add changeset %s\n" % short(x))
2002 1992 return len(cl)
2003 1993
2004 1994 def revmap(x):
2005 1995 return cl.rev(x)
2006 1996
2007 1997 if not source:
2008 1998 return 0
2009 1999
2010 2000 self.hook('prechangegroup', throw=True, source=srctype, url=url)
2011 2001
2012 2002 changesets = files = revisions = 0
2013 2003
2014 2004 # write changelog data to temp files so concurrent readers will not see
2015 2005 # inconsistent view
2016 2006 cl = self.changelog
2017 2007 cl.delayupdate()
2018 2008 oldheads = len(cl.heads())
2019 2009
2020 2010 tr = self.transaction()
2021 2011 try:
2022 2012 trp = weakref.proxy(tr)
2023 2013 # pull off the changeset group
2024 2014 self.ui.status(_("adding changesets\n"))
2025 2015 clstart = len(cl)
2026 2016 chunkiter = changegroup.chunkiter(source)
2027 2017 if cl.addgroup(chunkiter, csmap, trp) is None and not emptyok:
2028 2018 raise util.Abort(_("received changelog group is empty"))
2029 2019 clend = len(cl)
2030 2020 changesets = clend - clstart
2031 2021
2032 2022 # pull off the manifest group
2033 2023 self.ui.status(_("adding manifests\n"))
2034 2024 chunkiter = changegroup.chunkiter(source)
2035 2025 # no need to check for empty manifest group here:
2036 2026 # if the result of the merge of 1 and 2 is the same in 3 and 4,
2037 2027 # no new manifest will be created and the manifest group will
2038 2028 # be empty during the pull
2039 2029 self.manifest.addgroup(chunkiter, revmap, trp)
2040 2030
2041 2031 # process the files
2042 2032 self.ui.status(_("adding file changes\n"))
2043 2033 while 1:
2044 2034 f = changegroup.getchunk(source)
2045 2035 if not f:
2046 2036 break
2047 2037 self.ui.debug("adding %s revisions\n" % f)
2048 2038 fl = self.file(f)
2049 2039 o = len(fl)
2050 2040 chunkiter = changegroup.chunkiter(source)
2051 2041 if fl.addgroup(chunkiter, revmap, trp) is None:
2052 2042 raise util.Abort(_("received file revlog group is empty"))
2053 2043 revisions += len(fl) - o
2054 2044 files += 1
2055 2045
2056 2046 newheads = len(cl.heads())
2057 2047 heads = ""
2058 2048 if oldheads and newheads != oldheads:
2059 2049 heads = _(" (%+d heads)") % (newheads - oldheads)
2060 2050
2061 2051 self.ui.status(_("added %d changesets"
2062 2052 " with %d changes to %d files%s\n")
2063 2053 % (changesets, revisions, files, heads))
2064 2054
2065 2055 if changesets > 0:
2066 2056 p = lambda: cl.writepending() and self.root or ""
2067 2057 self.hook('pretxnchangegroup', throw=True,
2068 2058 node=hex(cl.node(clstart)), source=srctype,
2069 2059 url=url, pending=p)
2070 2060
2071 2061 # make changelog see real files again
2072 2062 cl.finalize(trp)
2073 2063
2074 2064 tr.close()
2075 2065 finally:
2076 2066 del tr
2077 2067
2078 2068 if changesets > 0:
2079 2069 # forcefully update the on-disk branch cache
2080 2070 self.ui.debug("updating the branch cache\n")
2081 2071 self.branchtags()
2082 2072 self.hook("changegroup", node=hex(cl.node(clstart)),
2083 2073 source=srctype, url=url)
2084 2074
2085 2075 for i in xrange(clstart, clend):
2086 2076 self.hook("incoming", node=hex(cl.node(i)),
2087 2077 source=srctype, url=url)
2088 2078
2089 2079 # never return 0 here:
2090 2080 if newheads < oldheads:
2091 2081 return newheads - oldheads - 1
2092 2082 else:
2093 2083 return newheads - oldheads + 1
2094 2084
2095 2085
2096 2086 def stream_in(self, remote):
2097 2087 fp = remote.stream_out()
2098 2088 l = fp.readline()
2099 2089 try:
2100 2090 resp = int(l)
2101 2091 except ValueError:
2102 2092 raise error.ResponseError(
2103 2093 _('Unexpected response from remote server:'), l)
2104 2094 if resp == 1:
2105 2095 raise util.Abort(_('operation forbidden by server'))
2106 2096 elif resp == 2:
2107 2097 raise util.Abort(_('locking the remote repository failed'))
2108 2098 elif resp != 0:
2109 2099 raise util.Abort(_('the server sent an unknown error code'))
2110 2100 self.ui.status(_('streaming all changes\n'))
2111 2101 l = fp.readline()
2112 2102 try:
2113 2103 total_files, total_bytes = map(int, l.split(' ', 1))
2114 2104 except (ValueError, TypeError):
2115 2105 raise error.ResponseError(
2116 2106 _('Unexpected response from remote server:'), l)
2117 2107 self.ui.status(_('%d files to transfer, %s of data\n') %
2118 2108 (total_files, util.bytecount(total_bytes)))
2119 2109 start = time.time()
2120 2110 for i in xrange(total_files):
2121 2111 # XXX doesn't support '\n' or '\r' in filenames
2122 2112 l = fp.readline()
2123 2113 try:
2124 2114 name, size = l.split('\0', 1)
2125 2115 size = int(size)
2126 2116 except (ValueError, TypeError):
2127 2117 raise error.ResponseError(
2128 2118 _('Unexpected response from remote server:'), l)
2129 2119 self.ui.debug('adding %s (%s)\n' % (name, util.bytecount(size)))
2130 2120 # for backwards compat, name was partially encoded
2131 2121 ofp = self.sopener(store.decodedir(name), 'w')
2132 2122 for chunk in util.filechunkiter(fp, limit=size):
2133 2123 ofp.write(chunk)
2134 2124 ofp.close()
2135 2125 elapsed = time.time() - start
2136 2126 if elapsed <= 0:
2137 2127 elapsed = 0.001
2138 2128 self.ui.status(_('transferred %s in %.1f seconds (%s/sec)\n') %
2139 2129 (util.bytecount(total_bytes), elapsed,
2140 2130 util.bytecount(total_bytes / elapsed)))
2141 2131 self.invalidate()
2142 2132 return len(self.heads()) + 1
2143 2133
2144 2134 def clone(self, remote, heads=[], stream=False):
2145 2135 '''clone remote repository.
2146 2136
2147 2137 keyword arguments:
2148 2138 heads: list of revs to clone (forces use of pull)
2149 2139 stream: use streaming clone if possible'''
2150 2140
2151 2141 # now, all clients that can request uncompressed clones can
2152 2142 # read repo formats supported by all servers that can serve
2153 2143 # them.
2154 2144
2155 2145 # if revlog format changes, client will have to check version
2156 2146 # and format flags on "stream" capability, and use
2157 2147 # uncompressed only if compatible.
2158 2148
2159 2149 if stream and not heads and remote.capable('stream'):
2160 2150 return self.stream_in(remote)
2161 2151 return self.pull(remote, heads)
2162 2152
2163 2153 # used to avoid circular references so destructors work
2164 2154 def aftertrans(files):
2165 2155 renamefiles = [tuple(t) for t in files]
2166 2156 def a():
2167 2157 for src, dest in renamefiles:
2168 2158 util.rename(src, dest)
2169 2159 return a
2170 2160
2171 2161 def instance(ui, path, create):
2172 2162 return localrepository(ui, util.drop_scheme('file', path), create)
2173 2163
2174 2164 def islocal(path):
2175 2165 return True
General Comments 0
You need to be logged in to leave comments. Login now