##// END OF EJS Templates
changegroup: track changelog to manifest revision map explicitly...
Gregory Szorc -
r39034:40374b4a default
parent child Browse files
Show More
@@ -1,1419 +1,1419 b''
1 # changegroup.py - Mercurial changegroup manipulation functions
1 # changegroup.py - Mercurial changegroup manipulation functions
2 #
2 #
3 # Copyright 2006 Matt Mackall <mpm@selenic.com>
3 # Copyright 2006 Matt Mackall <mpm@selenic.com>
4 #
4 #
5 # This software may be used and distributed according to the terms of the
5 # This software may be used and distributed according to the terms of the
6 # GNU General Public License version 2 or any later version.
6 # GNU General Public License version 2 or any later version.
7
7
8 from __future__ import absolute_import
8 from __future__ import absolute_import
9
9
10 import os
10 import os
11 import struct
11 import struct
12 import weakref
12 import weakref
13
13
14 from .i18n import _
14 from .i18n import _
15 from .node import (
15 from .node import (
16 hex,
16 hex,
17 nullid,
17 nullid,
18 nullrev,
18 nullrev,
19 short,
19 short,
20 )
20 )
21
21
22 from .thirdparty import (
22 from .thirdparty import (
23 attr,
23 attr,
24 )
24 )
25
25
26 from . import (
26 from . import (
27 dagutil,
27 dagutil,
28 error,
28 error,
29 manifest,
29 manifest,
30 match as matchmod,
30 match as matchmod,
31 mdiff,
31 mdiff,
32 phases,
32 phases,
33 pycompat,
33 pycompat,
34 repository,
34 repository,
35 revlog,
35 revlog,
36 util,
36 util,
37 )
37 )
38
38
39 from .utils import (
39 from .utils import (
40 stringutil,
40 stringutil,
41 )
41 )
42
42
# Delta header layout for changegroup version 1: four 20-byte fields, which
# cg1unpacker._deltaheader unpacks as (node, p1, p2, linknode).
_CHANGEGROUPV1_DELTA_HEADER = struct.Struct("20s20s20s20s")
# Version 2 carries five 20-byte fields, which cg2unpacker._deltaheader
# unpacks as (node, p1, p2, deltabase, linknode).
_CHANGEGROUPV2_DELTA_HEADER = struct.Struct("20s20s20s20s20s")
# Version 3 appends an unsigned 16-bit flags field and pins big-endian byte
# order: (node, p1, p2, deltabase, linknode, flags).
_CHANGEGROUPV3_DELTA_HEADER = struct.Struct(">20s20s20s20s20sH")

# NOTE(review): presumably the name of the repository requirement for LFS;
# it is not referenced in this part of the file - confirm against callers.
LFS_REQUIREMENT = 'lfs'

# Short module-level alias for util.readexactly, used throughout this module.
readexactly = util.readexactly
50
50
def getchunk(stream):
    """Read one length-prefixed chunk from ``stream`` and return its payload.

    A chunk starts with a signed big-endian 32-bit length that counts the
    four prefix bytes themselves. A length of zero marks an empty chunk and
    yields ``""``; any other length of four or less is rejected with
    ``error.Abort``.
    """
    (framedlen,) = struct.unpack(">l", readexactly(stream, 4))
    if framedlen > 4:
        # The prefix includes its own four bytes, so the payload is shorter.
        return readexactly(stream, framedlen - 4)
    if framedlen:
        raise error.Abort(_("invalid chunk length %d") % framedlen)
    return ""
60
60
def chunkheader(length):
    """Build the 4-byte header for a chunk whose payload is ``length`` bytes.

    The encoded value is a signed big-endian 32-bit integer that also counts
    the header's own four bytes.
    """
    framedlen = length + 4
    return struct.pack(">l", framedlen)
64
64
def closechunk():
    """Build the header of an empty chunk: a big-endian 32-bit zero."""
    emptylen = 0
    return struct.pack(">l", emptylen)
68
68
def _fileheader(path):
    """Return ``path`` framed as a chunk: a chunk header followed by the path."""
    header = chunkheader(len(path))
    return header + path
72
72
def writechunks(ui, chunks, filename, vfs=None):
    """Write every item of ``chunks`` to a file and return that file's name.

    The stream is assumed to be a bundle file.

    When ``filename`` is given, the file is opened for binary writing,
    through ``vfs`` if one is supplied and with the builtin ``open()``
    otherwise. When ``filename`` is empty, a temporary file named
    ``hg-bundle-*.hg`` is created and its name is returned instead.

    If writing fails part-way, the file is closed and removed before the
    exception propagates.
    """
    out = None
    # Path to delete on failure; reset to None once everything is written.
    doomed = None
    try:
        if not filename:
            fd, filename = pycompat.mkstemp(prefix="hg-bundle-", suffix=".hg")
            out = os.fdopen(fd, r"wb")
        elif vfs:
            out = vfs.open(filename, "wb")
        else:
            # Increase default buffer size because default is usually
            # small (4k is common on Linux).
            out = open(filename, "wb", 131072)
        doomed = filename
        for piece in chunks:
            out.write(piece)
        doomed = None
        return filename
    finally:
        if out is not None:
            out.close()
        if doomed is not None:
            if filename and vfs:
                vfs.unlink(doomed)
            else:
                os.unlink(doomed)
106
106
class cg1unpacker(object):
    """Unpacker for cg1 changegroup streams.

    A changegroup unpacker handles the framing of the revision data in
    the wire format. Most consumers will want to use the apply()
    method to add the changes from the changegroup to a repository.

    If you're forwarding a changegroup unmodified to another consumer,
    use getchunks(), which returns an iterator of changegroup
    chunks. This is mostly useful for cases where you need to know the
    data stream has ended by observing the end of the changegroup.

    deltachunk() is useful only if you're applying delta data. Most
    consumers should prefer apply() instead.

    A few other public methods exist. Those are used only for
    bundlerepo and some debug commands - their use is discouraged.
    """
    # Struct describing the fixed-size header that precedes each delta.
    deltaheader = _CHANGEGROUPV1_DELTA_HEADER
    deltaheadersize = deltaheader.size
    version = '01'
    _grouplistcount = 1 # One list of files after the manifests

    def __init__(self, fh, alg, extras=None):
        """Wrap ``fh`` in a decompressing reader for bundle type ``alg``.

        An ``alg`` of None is treated as 'UN' and 'BZ' is mapped to the
        '_truncatedBZ' engine. Any ``alg`` that is not listed in
        util.compengines.supportedbundletypes raises error.Abort.
        ``extras`` is stored on the instance (an empty dict when falsy).
        """
        if alg is None:
            alg = 'UN'
        if alg not in util.compengines.supportedbundletypes:
            raise error.Abort(_('unknown stream compression type: %s')
                              % alg)
        if alg == 'BZ':
            alg = '_truncatedBZ'

        compengine = util.compengines.forbundletype(alg)
        self._stream = compengine.decompressorreader(fh)
        self._type = alg
        self.extras = extras or {}
        # Optional zero-argument callable invoked by _chunklength() for
        # every non-empty chunk; used to drive progress reporting.
        self.callback = None

    # These methods (compressed, read, seek, tell) all appear to only
    # be used by bundlerepo, but it's a little hard to tell.
    def compressed(self):
        """Return True when the stream type is set and is not 'UN'."""
        return self._type is not None and self._type != 'UN'
    def read(self, l):
        """Read ``l`` bytes from the underlying (decompressed) stream."""
        return self._stream.read(l)
    def seek(self, pos):
        """Delegate to the underlying stream's seek()."""
        return self._stream.seek(pos)
    def tell(self):
        """Delegate to the underlying stream's tell()."""
        return self._stream.tell()
    def close(self):
        """Delegate to the underlying stream's close()."""
        return self._stream.close()

    def _chunklength(self):
        """Read a chunk length prefix and return the payload size.

        Returns 0 for an empty chunk (prefix of zero). Any other prefix of
        four or less raises error.Abort. For a non-empty chunk the
        ``callback`` attribute, if set, is invoked once before returning.
        """
        d = readexactly(self._stream, 4)
        l = struct.unpack(">l", d)[0]
        if l <= 4:
            if l:
                raise error.Abort(_("invalid chunk length %d") % l)
            return 0
        if self.callback:
            self.callback()
        # The prefix counts its own four bytes.
        return l - 4

    def changelogheader(self):
        """v10 does not have a changelog header chunk"""
        return {}

    def manifestheader(self):
        """v10 does not have a manifest header chunk"""
        return {}

    def filelogheader(self):
        """return the header of the filelogs chunk, v10 only has the filename

        An empty dict is returned when the next chunk is empty.
        """
        l = self._chunklength()
        if not l:
            return {}
        fname = readexactly(self._stream, l)
        return {'filename': fname}

    def _deltaheader(self, headertuple, prevnode):
        """Normalize an unpacked cg1 delta header.

        The cg1 header has no delta base field: the base is ``prevnode``,
        or p1 when ``prevnode`` is None. Flags are always 0.

        Returns (node, p1, p2, deltabase, cs, flags).
        """
        node, p1, p2, cs = headertuple
        if prevnode is None:
            deltabase = p1
        else:
            deltabase = prevnode
        flags = 0
        return node, p1, p2, deltabase, cs, flags

    def deltachunk(self, prevnode):
        """Read the next delta chunk of the current group.

        Returns an empty dict when the chunk is empty, otherwise the tuple
        (node, p1, p2, cs, deltabase, delta, flags). Note that the field
        order differs from what _deltaheader() returns.
        """
        l = self._chunklength()
        if not l:
            return {}
        headerdata = readexactly(self._stream, self.deltaheadersize)
        header = self.deltaheader.unpack(headerdata)
        # Whatever follows the fixed-size header is the delta payload.
        delta = readexactly(self._stream, l - self.deltaheadersize)
        node, p1, p2, deltabase, cs, flags = self._deltaheader(header, prevnode)
        return (node, p1, p2, cs, deltabase, delta, flags)

    def getchunks(self):
        """returns all the chunks contained in the bundle

        Used when you need to forward the binary stream to a file or another
        network API. To do so, it parses the changegroup data, otherwise it
        will block in case of sshrepo because it doesn't know the end of the
        stream.
        """
        # For changegroup 1 and 2, we expect 3 parts: changelog, manifestlog,
        # and a list of filelogs. For changegroup 3, we expect 4 parts:
        # changelog, manifestlog, a list of tree manifestlogs, and a list of
        # filelogs.
        #
        # Changelog and manifestlog parts are terminated with empty chunks. The
        # tree and file parts are a list of entry sections. Each entry section
        # is a series of chunks terminating in an empty chunk. The list of these
        # entry sections is terminated in yet another empty chunk, so we know
        # we've reached the end of the tree/file list when we reach an empty
        # chunk that was preceded by no non-empty chunks.

        parts = 0
        while parts < 2 + self._grouplistcount:
            noentries = True
            while True:
                chunk = getchunk(self)
                if not chunk:
                    # The first two empty chunks represent the end of the
                    # changelog and the manifestlog portions. The remaining
                    # empty chunks represent either A) the end of individual
                    # tree or file entries in the file list, or B) the end of
                    # the entire list. It's the end of the entire list if there
                    # were no entries (i.e. noentries is True).
                    if parts < 2:
                        parts += 1
                    elif noentries:
                        parts += 1
                    break
                noentries = False
                yield chunkheader(len(chunk))
                # Emit the payload in slices of at most 2**20 bytes.
                pos = 0
                while pos < len(chunk):
                    next = pos + 2**20
                    yield chunk[pos:next]
                    pos = next
            yield closechunk()

    def _unpackmanifests(self, repo, revmap, trp, prog):
        """Add the manifest group to ``repo.manifestlog``.

        ``prog.increment`` is installed as the chunk callback while the
        group is read, and ``prog.complete()`` is called afterwards.
        """
        self.callback = prog.increment
        # no need to check for empty manifest group here:
        # if the result of the merge of 1 and 2 is the same in 3 and 4,
        # no new manifest will be created and the manifest group will
        # be empty during the pull
        self.manifestheader()
        deltas = self.deltaiter()
        repo.manifestlog.addgroup(deltas, revmap, trp)
        prog.complete()
        self.callback = None

    def apply(self, repo, tr, srctype, url, targetphase=phases.draft,
              expectedtotal=None):
        """Add the changegroup returned by source.read() to this repo.
        srctype is a string like 'push', 'pull', or 'unbundle'.  url is
        the URL of the repo where this changegroup is coming from.

        Return an integer summarizing the change to this repo:
        - nothing changed or no source: 0
        - more heads than before: 1+added heads (2..n)
        - fewer heads than before: -1-removed heads (-2..-n)
        - number of heads stays the same: 1

        Note that the return statement at the end of this method never
        produces 0: the head delta is always shifted away from zero by one.
        """
        repo = repo.unfiltered()
        # Link mapper for the changelog group: each incoming changeset links
        # to the revision number it is about to receive.
        def csmap(x):
            repo.ui.debug("add changeset %s\n" % short(x))
            return len(cl)

        # Link mapper for manifests and files: node -> changelog revision.
        def revmap(x):
            return cl.rev(x)

        changesets = files = revisions = 0

        try:
            # The transaction may already carry source information. In this
            # case we use the top level data. We overwrite the argument
            # because we need to use the top level value (if they exist)
            # in this function.
            srctype = tr.hookargs.setdefault('source', srctype)
            url = tr.hookargs.setdefault('url', url)
            repo.hook('prechangegroup',
                      throw=True, **pycompat.strkwargs(tr.hookargs))

            # write changelog data to temp files so concurrent readers
            # will not see an inconsistent view
            cl = repo.changelog
            cl.delayupdate(tr)
            oldheads = set(cl.heads())

            # Hand a weak proxy of the transaction to the storage layer.
            trp = weakref.proxy(tr)
            # pull off the changeset group
            repo.ui.status(_("adding changesets\n"))
            clstart = len(cl)
            progress = repo.ui.makeprogress(_('changesets'), unit=_('chunks'),
                                            total=expectedtotal)
            self.callback = progress.increment

            # Collect the files named by each added changeset; only the
            # count is kept once the group has been added.
            efiles = set()
            def onchangelog(cl, node):
                efiles.update(cl.readfiles(node))

            self.changelogheader()
            deltas = self.deltaiter()
            cgnodes = cl.addgroup(deltas, csmap, trp, addrevisioncb=onchangelog)
            efiles = len(efiles)

            if not cgnodes:
                repo.ui.develwarn('applied empty changegroup',
                                  config='warn-empty-changegroup')
            clend = len(cl)
            changesets = clend - clstart
            progress.complete()
            self.callback = None

            # pull off the manifest group
            repo.ui.status(_("adding manifests\n"))
            # We know that we'll never have more manifests than we had
            # changesets.
            progress = repo.ui.makeprogress(_('manifests'), unit=_('chunks'),
                                            total=changesets)
            self._unpackmanifests(repo, revmap, trp, progress)

            needfiles = {}
            if repo.ui.configbool('server', 'validate'):
                cl = repo.changelog
                ml = repo.manifestlog
                # validate incoming csets have their manifests
                for cset in pycompat.xrange(clstart, clend):
                    mfnode = cl.changelogrevision(cset).manifest
                    mfest = ml[mfnode].readdelta()
                    # store file cgnodes we must see
                    for f, n in mfest.iteritems():
                        needfiles.setdefault(f, set()).add(n)

            # process the files
            repo.ui.status(_("adding file changes\n"))
            newrevs, newfiles = _addchangegroupfiles(
                repo, self, revmap, trp, efiles, needfiles)
            revisions += newrevs
            files += newfiles

            # Net change in head count; a new head that closes its branch
            # is not counted as an added head.
            deltaheads = 0
            if oldheads:
                heads = cl.heads()
                deltaheads = len(heads) - len(oldheads)
                for h in heads:
                    if h not in oldheads and repo[h].closesbranch():
                        deltaheads -= 1
            htext = ""
            if deltaheads:
                htext = _(" (%+d heads)") % deltaheads

            repo.ui.status(_("added %d changesets"
                             " with %d changes to %d files%s\n")
                           % (changesets, revisions, files, htext))
            repo.invalidatevolatilesets()

            if changesets > 0:
                # Only record node/node_last on the transaction itself when
                # no 'node' is present yet; otherwise use a private copy.
                if 'node' not in tr.hookargs:
                    tr.hookargs['node'] = hex(cl.node(clstart))
                    tr.hookargs['node_last'] = hex(cl.node(clend - 1))
                    hookargs = dict(tr.hookargs)
                else:
                    hookargs = dict(tr.hookargs)
                    hookargs['node'] = hex(cl.node(clstart))
                    hookargs['node_last'] = hex(cl.node(clend - 1))
                repo.hook('pretxnchangegroup',
                          throw=True, **pycompat.strkwargs(hookargs))

            added = [cl.node(r) for r in pycompat.xrange(clstart, clend)]
            phaseall = None
            if srctype in ('push', 'serve'):
                # Old servers can not push the boundary themselves.
                # New servers won't push the boundary if changeset already
                # exists locally as secret
                #
                # We should not use added here but the list of all change in
                # the bundle
                if repo.publishing():
                    targetphase = phaseall = phases.public
                else:
                    # closer target phase computation

                    # Those changesets have been pushed from the
                    # outside, their phases are going to be pushed
                    # alongside. Therefore `targetphase` is
                    # ignored.
                    targetphase = phaseall = phases.draft
            if added:
                phases.registernew(repo, tr, targetphase, added)
            if phaseall is not None:
                phases.advanceboundary(repo, tr, phaseall, cgnodes)

            if changesets > 0:

                def runhooks():
                    # These hooks run when the lock releases, not when the
                    # transaction closes. So it's possible for the changelog
                    # to have changed since we last saw it.
                    if clstart >= len(repo):
                        return

                    repo.hook("changegroup", **pycompat.strkwargs(hookargs))

                    # The "incoming" hook fires once per added changeset,
                    # with 'node' set to that changeset and no 'node_last'.
                    for n in added:
                        args = hookargs.copy()
                        args['node'] = hex(n)
                        del args['node_last']
                        repo.hook("incoming", **pycompat.strkwargs(args))

                    newheads = [h for h in repo.heads()
                                if h not in oldheads]
                    repo.ui.log("incoming",
                                "%d incoming changes - new heads: %s\n",
                                len(added),
                                ', '.join([hex(c[:6]) for c in newheads]))

                tr.addpostclose('changegroup-runhooks-%020i' % clstart,
                                lambda tr: repo._afterlock(runhooks))
        finally:
            repo.ui.flush()
        # never return 0 here:
        if deltaheads < 0:
            ret = deltaheads - 1
        else:
            ret = deltaheads + 1
        return ret

    def deltaiter(self):
        """
        returns an iterator of the deltas in this changegroup

        Useful for passing to the underlying storage system to be stored.
        """
        # ``chain`` is the node of the previously yielded delta; the lambda
        # reads it on every call, so deltachunk() always sees the latest one.
        # Iteration stops when deltachunk() returns the empty-dict sentinel.
        chain = None
        for chunkdata in iter(lambda: self.deltachunk(chain), {}):
            # Chunkdata: (node, p1, p2, cs, deltabase, delta, flags)
            yield chunkdata
            chain = chunkdata[0]
449
449
class cg2unpacker(cg1unpacker):
    """Unpacker for cg2 streams.

    The cg2 delta header names its delta base explicitly (which is what
    makes generaldelta exchange possible), so only the header layout and
    its decoding differ from cg1.
    """
    deltaheader = _CHANGEGROUPV2_DELTA_HEADER
    deltaheadersize = deltaheader.size
    version = '02'

    def _deltaheader(self, headertuple, prevnode):
        """Normalize an unpacked cg2 header; ``prevnode`` is not consulted.

        Returns (node, p1, p2, deltabase, cs, flags) with flags fixed at 0.
        """
        (node, parent1, parent2, basenode, linknode) = headertuple
        return (node, parent1, parent2, basenode, linknode, 0)
465
465
class cg3unpacker(cg2unpacker):
    """Unpacker for cg3 streams.

    cg3 carries revlog flags in the delta header and can exchange
    treemanifests: after the root manifest group comes a list of
    directory manifest groups, closed by an empty chunk, before the files.
    """
    deltaheader = _CHANGEGROUPV3_DELTA_HEADER
    deltaheadersize = deltaheader.size
    version = '03'
    _grouplistcount = 2 # One list of manifests and one list of files

    def _deltaheader(self, headertuple, prevnode):
        """Normalize an unpacked cg3 header; ``prevnode`` is not consulted.

        The header already holds all six fields, so they are passed through
        as (node, p1, p2, deltabase, cs, flags).
        """
        (node, parent1, parent2, basenode, linknode, revflags) = headertuple
        return (node, parent1, parent2, basenode, linknode, revflags)

    def _unpackmanifests(self, repo, revmap, trp, prog):
        """Add the root manifest group, then every directory manifest group.

        Raises error.Abort when a directory group adds no revisions.
        """
        super(cg3unpacker, self)._unpackmanifests(repo, revmap, trp, prog)
        while True:
            header = self.filelogheader()
            if header == {}:
                # An empty header chunk closes the list of directory groups.
                break
            # If we get here, there are directory manifests in the changegroup
            dirname = header["filename"]
            repo.ui.debug("adding %s revisions\n" % dirname)
            dirlog = repo.manifestlog._revlog.dirlog(dirname)
            added = dirlog.addgroup(self.deltaiter(), revmap, trp)
            if not added:
                raise error.Abort(_("received dir revlog group is empty"))
492
492
class headerlessfixup(object):
    """File-like reader that serves already-consumed bytes before ``fh``.

    ``h`` holds bytes that were read from ``fh`` earlier; read() returns
    them first and only then continues with the underlying file.
    """

    def __init__(self, fh, h):
        self._fh = fh
        self._h = h

    def read(self, n):
        """Return ``n`` bytes, draining the buffered header before ``fh``."""
        if not self._h:
            return readexactly(self._fh, n)
        head = self._h[:n]
        self._h = self._h[n:]
        missing = n - len(head)
        if missing > 0:
            # The buffered header ran out; top up from the real file.
            head += readexactly(self._fh, missing)
        return head
504
504
@attr.s(slots=True, frozen=True)
class revisiondelta(object):
    """Describes a delta entry in a changegroup.

    Captured data is sufficient to serialize the delta into multiple
    formats.

    The class is declared with ``slots=True`` and ``frozen=True``. The
    attributes are declared in the order: node, p1node, p2node, basenode,
    linknode, flags, deltachunks.
    """
    # 20 byte node of this revision.
    node = attr.ib()
    # 20 byte nodes of parent revisions.
    p1node = attr.ib()
    p2node = attr.ib()
    # 20 byte node of the revision this delta is against.
    basenode = attr.ib()
    # 20 byte node of changeset revision this delta is associated with.
    linknode = attr.ib()
    # 2 bytes of flags to apply to revision data.
    flags = attr.ib()
    # Iterable of chunks holding raw delta data.
    deltachunks = attr.ib()
525
525
526 def _sortnodesnormal(store, nodes, reorder):
526 def _sortnodesnormal(store, nodes, reorder):
527 """Sort nodes for changegroup generation and turn into revnums."""
527 """Sort nodes for changegroup generation and turn into revnums."""
528 # for generaldelta revlogs, we linearize the revs; this will both be
528 # for generaldelta revlogs, we linearize the revs; this will both be
529 # much quicker and generate a much smaller bundle
529 # much quicker and generate a much smaller bundle
530 if (store._generaldelta and reorder is None) or reorder:
530 if (store._generaldelta and reorder is None) or reorder:
531 dag = dagutil.revlogdag(store)
531 dag = dagutil.revlogdag(store)
532 return dag.linearize(set(store.rev(n) for n in nodes))
532 return dag.linearize(set(store.rev(n) for n in nodes))
533 else:
533 else:
534 return sorted([store.rev(n) for n in nodes])
534 return sorted([store.rev(n) for n in nodes])
535
535
536 def _sortnodesellipsis(store, nodes, cl, lookup):
536 def _sortnodesellipsis(store, nodes, cl, lookup):
537 """Sort nodes for changegroup generation and turn into revnums."""
537 """Sort nodes for changegroup generation and turn into revnums."""
538 # Ellipses serving mode.
538 # Ellipses serving mode.
539 #
539 #
540 # In a perfect world, we'd generate better ellipsis-ified graphs
540 # In a perfect world, we'd generate better ellipsis-ified graphs
541 # for non-changelog revlogs. In practice, we haven't started doing
541 # for non-changelog revlogs. In practice, we haven't started doing
542 # that yet, so the resulting DAGs for the manifestlog and filelogs
542 # that yet, so the resulting DAGs for the manifestlog and filelogs
543 # are actually full of bogus parentage on all the ellipsis
543 # are actually full of bogus parentage on all the ellipsis
544 # nodes. This has the side effect that, while the contents are
544 # nodes. This has the side effect that, while the contents are
545 # correct, the individual DAGs might be completely out of whack in
545 # correct, the individual DAGs might be completely out of whack in
546 # a case like 882681bc3166 and its ancestors (back about 10
546 # a case like 882681bc3166 and its ancestors (back about 10
547 # revisions or so) in the main hg repo.
547 # revisions or so) in the main hg repo.
548 #
548 #
549 # The one invariant we *know* holds is that the new (potentially
549 # The one invariant we *know* holds is that the new (potentially
550 # bogus) DAG shape will be valid if we order the nodes in the
550 # bogus) DAG shape will be valid if we order the nodes in the
551 # order that they're introduced in dramatis personae by the
551 # order that they're introduced in dramatis personae by the
552 # changelog, so what we do is we sort the non-changelog histories
552 # changelog, so what we do is we sort the non-changelog histories
553 # by the order in which they are used by the changelog.
553 # by the order in which they are used by the changelog.
554 key = lambda n: cl.rev(lookup(n))
554 key = lambda n: cl.rev(lookup(n))
555 return [store.rev(n) for n in sorted(nodes, key=key)]
555 return [store.rev(n) for n in sorted(nodes, key=key)]
556
556
def _revisiondeltanormal(store, rev, prev, linknode, deltaparentfn):
    """Build the revisiondelta for ``rev`` outside of ellipsis mode.

    ``deltaparentfn`` chooses the base revision. When the base or the
    revision itself is censored, or when the base is nullrev, the raw
    revision text is sent behind a synthesized diff header; otherwise
    the delta produced by ``store.revdiff()`` is sent without a prefix.
    """
    node = store.node(rev)
    p1rev, p2rev = store.parentrevs(rev)
    base = deltaparentfn(store, rev, p1rev, p2rev, prev)

    if store.iscensored(base) or store.iscensored(rev):
        # Censored data cannot be diffed: send the raw text, or the
        # tombstone carried by the exception when reading it fails.
        try:
            payload = store.revision(node, raw=True)
        except error.CensoredNodeError as exc:
            payload = exc.tombstone
        if base == nullrev:
            header = mdiff.trivialdiffheader(len(payload))
        else:
            header = mdiff.replacediffheader(store.rawsize(base),
                                             len(payload))
    elif base != nullrev:
        header = ''
        payload = store.revdiff(base, rev)
    else:
        payload = store.revision(node, raw=True)
        header = mdiff.trivialdiffheader(len(payload))

    parent1, parent2 = store.parents(node)

    return revisiondelta(
        node=node,
        p1node=parent1,
        p2node=parent2,
        basenode=store.node(base),
        linknode=linknode,
        flags=store.flags(rev),
        deltachunks=(header, payload),
    )
590
590
591 class cgpacker(object):
591 class cgpacker(object):
592 def __init__(self, repo, filematcher, version, allowreorder,
592 def __init__(self, repo, filematcher, version, allowreorder,
593 deltaparentfn, builddeltaheader, manifestsend,
593 deltaparentfn, builddeltaheader, manifestsend,
594 bundlecaps=None, ellipses=False,
594 bundlecaps=None, ellipses=False,
595 shallow=False, ellipsisroots=None, fullnodes=None):
595 shallow=False, ellipsisroots=None, fullnodes=None):
596 """Given a source repo, construct a bundler.
596 """Given a source repo, construct a bundler.
597
597
598 filematcher is a matcher that matches on files to include in the
598 filematcher is a matcher that matches on files to include in the
599 changegroup. Used to facilitate sparse changegroups.
599 changegroup. Used to facilitate sparse changegroups.
600
600
601 allowreorder controls whether reordering of revisions is allowed.
601 allowreorder controls whether reordering of revisions is allowed.
602 This value is used when ``bundle.reorder`` is ``auto`` or isn't
602 This value is used when ``bundle.reorder`` is ``auto`` or isn't
603 set.
603 set.
604
604
605 deltaparentfn is a callable that resolves the delta parent for
605 deltaparentfn is a callable that resolves the delta parent for
606 a specific revision.
606 a specific revision.
607
607
608 builddeltaheader is a callable that constructs the header for a group
608 builddeltaheader is a callable that constructs the header for a group
609 delta.
609 delta.
610
610
611 manifestsend is a chunk to send after manifests have been fully emitted.
611 manifestsend is a chunk to send after manifests have been fully emitted.
612
612
613 ellipses indicates whether ellipsis serving mode is enabled.
613 ellipses indicates whether ellipsis serving mode is enabled.
614
614
615 bundlecaps is optional and can be used to specify the set of
615 bundlecaps is optional and can be used to specify the set of
616 capabilities which can be used to build the bundle. While bundlecaps is
616 capabilities which can be used to build the bundle. While bundlecaps is
617 unused in core Mercurial, extensions rely on this feature to communicate
617 unused in core Mercurial, extensions rely on this feature to communicate
618 capabilities to customize the changegroup packer.
618 capabilities to customize the changegroup packer.
619
619
620 shallow indicates whether shallow data might be sent. The packer may
620 shallow indicates whether shallow data might be sent. The packer may
621 need to pack file contents not introduced by the changes being packed.
621 need to pack file contents not introduced by the changes being packed.
622
622
623 fullnodes is the set of changelog nodes which should not be ellipsis
623 fullnodes is the set of changelog nodes which should not be ellipsis
624 nodes. We store this rather than the set of nodes that should be
624 nodes. We store this rather than the set of nodes that should be
625 ellipsis because for very large histories we expect this to be
625 ellipsis because for very large histories we expect this to be
626 significantly smaller.
626 significantly smaller.
627 """
627 """
628 assert filematcher
628 assert filematcher
629 self._filematcher = filematcher
629 self._filematcher = filematcher
630
630
631 self.version = version
631 self.version = version
632 self._deltaparentfn = deltaparentfn
632 self._deltaparentfn = deltaparentfn
633 self._builddeltaheader = builddeltaheader
633 self._builddeltaheader = builddeltaheader
634 self._manifestsend = manifestsend
634 self._manifestsend = manifestsend
635 self._ellipses = ellipses
635 self._ellipses = ellipses
636
636
637 # Set of capabilities we can use to build the bundle.
637 # Set of capabilities we can use to build the bundle.
638 if bundlecaps is None:
638 if bundlecaps is None:
639 bundlecaps = set()
639 bundlecaps = set()
640 self._bundlecaps = bundlecaps
640 self._bundlecaps = bundlecaps
641 self._isshallow = shallow
641 self._isshallow = shallow
642 self._fullclnodes = fullnodes
642 self._fullclnodes = fullnodes
643
643
644 # Maps ellipsis revs to their roots at the changelog level.
644 # Maps ellipsis revs to their roots at the changelog level.
645 self._precomputedellipsis = ellipsisroots
645 self._precomputedellipsis = ellipsisroots
646
646
647 # experimental config: bundle.reorder
647 # experimental config: bundle.reorder
648 reorder = repo.ui.config('bundle', 'reorder')
648 reorder = repo.ui.config('bundle', 'reorder')
649 if reorder == 'auto':
649 if reorder == 'auto':
650 self._reorder = allowreorder
650 self._reorder = allowreorder
651 else:
651 else:
652 self._reorder = stringutil.parsebool(reorder)
652 self._reorder = stringutil.parsebool(reorder)
653
653
654 self._repo = repo
654 self._repo = repo
655
655
656 if self._repo.ui.verbose and not self._repo.ui.debugflag:
656 if self._repo.ui.verbose and not self._repo.ui.debugflag:
657 self._verbosenote = self._repo.ui.note
657 self._verbosenote = self._repo.ui.note
658 else:
658 else:
659 self._verbosenote = lambda s: None
659 self._verbosenote = lambda s: None
660
660
661 # Maps CL revs to per-revlog revisions. Cleared in close() at
661 # Maps CL revs to per-revlog revisions. Cleared in close() at
662 # the end of each group.
662 # the end of each group.
663 self._clrevtolocalrev = {}
663 self._clrevtolocalrev = {}
664 self._nextclrevtolocalrev = {}
665
664
def _close(self):
    """Reset per-group state and return the chunk closing a group."""
    # Ellipses serving mode: the changelog rev to local rev mapping
    # only applies to the group that just ended.
    self._clrevtolocalrev.clear()

    endchunk = closechunk()
    return endchunk
674
670
def group(self, revs, store, ischangelog, lookup, units=None):
    """Calculate a delta group, yielding a sequence of changegroup chunks
    (strings).

    ``revs`` is a sequence of revision numbers of ``store``. Deltas and
    metadata are emitted for each of them, in order. The first delta is
    computed against the first parent of ``revs[0]``; the receiver is
    guaranteed to have this parent as it has all history before these
    changesets. When that parent is nullrev, the group starts with a
    full revision.

    ``lookup`` maps a node of ``store`` to the node of the changeset it
    is linked to.

    If units is not None, progress detail will be generated, units
    specifies the type of revlog that is touched (changelog, manifest,
    etc.).

    ``revs`` is never modified. The group always ends with the chunk
    returned by ``self._close()``.
    """
    # if we don't have any revisions touched by these changesets, bail
    if len(revs) == 0:
        yield self._close()
        return

    cl = self._repo.changelog

    # The first revision is diffed against its first parent. Keep that
    # parent in a local instead of inserting it into ``revs`` so that
    # the caller's sequence is left untouched.
    prev = store.parentrevs(revs[0])[0]

    # build deltas
    progress = None
    if units is not None:
        progress = self._repo.ui.makeprogress(_('bundling'), unit=units,
                                              total=len(revs))

    for count, curr in enumerate(revs, 1):
        if progress:
            progress.update(count)
        linknode = lookup(store.node(curr))

        if self._ellipses:
            linkrev = cl.rev(linknode)
            self._clrevtolocalrev[linkrev] = curr

            # This is a node to send in full, because the changeset it
            # corresponds to was a full changeset.
            if linknode in self._fullclnodes:
                delta = _revisiondeltanormal(store, curr, prev, linknode,
                                             self._deltaparentfn)
            elif linkrev not in self._precomputedellipsis:
                delta = None
            else:
                delta = self._revisiondeltanarrow(store, ischangelog,
                                                  curr, linkrev, linknode)
        else:
            delta = _revisiondeltanormal(store, curr, prev, linknode,
                                         self._deltaparentfn)

        if delta:
            meta = self._builddeltaheader(delta)
            l = len(meta) + sum(len(x) for x in delta.deltachunks)
            yield chunkheader(l)
            yield meta
            for x in delta.deltachunks:
                yield x

        # A skipped revision still becomes the predecessor of the next
        # one, exactly as if it had been emitted.
        prev = curr

    if progress:
        progress.complete()
    yield self._close()
742
738
# filter any nodes that claim to be part of the known set
def _prune(self, store, missing, commonrevs):
    """Return the nodes of ``missing`` whose linkrev is not in commonrevs.

    For a manifest revlog whose directory the file matcher does not
    visit, nothing is kept and an empty list is returned.
    """
    # TODO this violates storage abstraction for manifests.
    if isinstance(store, manifest.manifestrevlog):
        visitpath = store._dir[:-1] or '.'
        if not self._filematcher.visitdir(visitpath):
            return []

    torev = store.rev
    tolinkrev = store.linkrev
    kept = []
    for node in missing:
        if tolinkrev(torev(node)) not in commonrevs:
            kept.append(node)
    return kept
752
748
def _packmanifests(self, dir, dirlog, revs, lookuplinknode):
    """Pack manifests into a changegroup stream.

    For a non-empty ``dir`` the directory name is encoded in the output
    first, which allows several manifests to be sent. cg1 and cg2 do not
    support multiple manifests, hence the version assertion.
    """
    if dir:
        assert self.version == b'03'
        yield _fileheader(dir)

    chunks = self.group(revs, dirlog, False, lookuplinknode,
                        units=_('manifests'))
    for chunk in chunks:
        yield chunk
766
762
def generate(self, commonrevs, clnodes, fastpathlinkrev, source):
    """Yield a sequence of changegroup byte chunks.

    Changelog chunks come first, then manifests, then files, then a
    final closing chunk. The ``outgoing`` hook runs last, and only when
    ``clnodes`` is not empty.
    """
    repo = self._repo
    cl = repo.changelog

    self._verbosenote(_('uncompressed size of bundle content:\n'))

    clstate, clchunks = self._generatechangelog(cl, clnodes)
    size = 0
    for chunk in clchunks:
        size += len(chunk)
        yield chunk

    self._verbosenote(_('%8.i (changelog)\n') % size)

    # The state is only read once the changelog chunks are consumed.
    clrevorder = clstate['clrevorder']
    mfs = clstate['mfs']
    changedfiles = clstate['changedfiles']

    if self._ellipses:
        self._clrevtolocalrev = clstate['clrevtomanifestrev']

    # We need to make sure that the linkrev in the changegroup refers to
    # the first changeset that introduced the manifest or file revision.
    # The fastpath is usually safer than the slowpath, because the filelogs
    # are walked in revlog order.
    #
    # When taking the slowpath with reorder=None and the manifest revlog
    # uses generaldelta, the manifest may be walked in the "wrong" order.
    # Without 'clrevorder', we would get an incorrect linkrev (see fix in
    # cc0ff93d0c0c).
    #
    # When taking the fastpath, we are only vulnerable to reordering
    # of the changelog itself. The changelog never uses generaldelta, so
    # it is only reordered when reorder=True. To handle this case, we
    # simply take the slowpath, which already has the 'clrevorder' logic.
    # This was also fixed in cc0ff93d0c0c.
    #
    # Treemanifests don't work correctly with fastpathlinkrev
    # either, because we don't discover which directory nodes to
    # send along with files. This could probably be fixed.
    usefastpath = (fastpathlinkrev
                   and not self._reorder
                   and 'treemanifest' not in repo.requirements)

    fnodes = {} # needed file nodes

    mfchunks = self.generatemanifests(commonrevs, clrevorder,
                                      usefastpath, mfs, fnodes, source)
    for chunk in mfchunks:
        yield chunk

    mfdicts = None
    if self._ellipses and self._isshallow:
        mfdicts = []
        for mfnode, linkrevnode in mfs.iteritems():
            mfdicts.append((self._repo.manifestlog[mfnode].read(),
                            linkrevnode))

    mfs.clear()
    clrevs = set(cl.rev(x) for x in clnodes)

    if usefastpath:
        cln = cl.node
        def linknodes(filerevlog, fname):
            # Derive the linknodes from the linkrevs stored in the
            # filelog, keeping those that point at a packed changeset.
            llr = filerevlog.linkrev
            fln = filerevlog.node
            found = {}
            for r in filerevlog:
                lr = llr(r)
                if lr in clrevs:
                    found[fln(r)] = cln(lr)
            return found
    else:
        def linknodes(unused, fname):
            # fnodes was filled in while the manifests were emitted.
            return fnodes.get(fname, {})

    filechunks = self.generatefiles(changedfiles, linknodes, commonrevs,
                                    source, mfdicts)
    for chunk in filechunks:
        yield chunk

    yield self._close()

    if clnodes:
        repo.hook('outgoing', node=hex(clnodes[0]), source=source)
842
841
def _generatechangelog(self, cl, nodes):
    """Generate data for changelog chunks.

    Returns a 2-tuple made of a state dict and an iterable of byte
    chunks. The state dict holds ``clrevorder``, ``mfs``,
    ``changedfiles`` and ``clrevtomanifestrev``. It is filled in as a
    side effect of producing the chunks, so it is not fully populated
    until the chunk stream has been fully consumed.
    """
    mfl = self._repo.manifestlog
    # TODO violates storage abstraction.
    mfrevlog = mfl._revlog

    clrevorder = {}
    mfs = {} # needed manifests
    changedfiles = set()
    clrevtomanifestrev = {}

    # Callback for the changelog, used to collect changed files and
    # manifest nodes.
    # Returns the linkrev node (identity in the changelog case).
    def lookupcl(x):
        c = cl.read(x)
        clrevorder[x] = len(clrevorder)

        if not self._ellipses:
            mfnode = c[0]
            # record the first changeset introducing this manifest version
            mfs.setdefault(mfnode, x)
            # Record a complete list of potentially-changed files in
            # this manifest.
            changedfiles.update(c[3])
            return x

        # Only update mfs if x is going to be sent. Otherwise we
        # end up with bogus linkrevs specified for manifests and
        # we skip some manifest nodes that we should otherwise
        # have sent.
        if (x in self._fullclnodes
            or cl.rev(x) in self._precomputedellipsis):
            mfnode = c[0]
            # Record the first changeset introducing this manifest
            # version.
            mfs.setdefault(mfnode, x)
            # Set this narrow-specific dict so we have the lowest
            # manifest revnum to look up for this cl revnum. (Part of
            # mapping changelog ellipsis parents to manifest ellipsis
            # parents)
            clrevtomanifestrev.setdefault(cl.rev(x), mfrevlog.rev(mfnode))

        # We can't trust the changed files list in the changeset if the
        # client requested a shallow clone.
        if self._isshallow:
            changedfiles.update(mfl[c[0]].read().keys())
        else:
            changedfiles.update(c[3])

        return x

    # Changelog doesn't benefit from reordering revisions. So send out
    # revisions in store order.
    revs = [cl.rev(n) for n in nodes]
    revs.sort()

    state = {
        'clrevorder': clrevorder,
        'mfs': mfs,
        'changedfiles': changedfiles,
        'clrevtomanifestrev': clrevtomanifestrev,
    }

    chunks = self.group(revs, cl, True, lookupcl, units=_('changesets'))

    return state, chunks
911
911
def generatemanifests(self, commonrevs, clrevorder, fastpathlinkrev, mfs,
                      fnodes, source):
    """Returns an iterator of changegroup chunks containing manifests.

    The root manifest group is always emitted; a directory manifest
    group is emitted only when nodes remain after pruning. The stream
    ends with ``self._manifestsend``.

    `source` is unused here, but is used by extensions like remotefilelog to
    change what is sent based on pulls vs pushes, etc.
    """
    repo = self._repo
    cl = repo.changelog
    mfl = repo.manifestlog
    dirlog = mfl._revlog.dirlog
    # Pending manifest groups: directory -> {manifest node: cl node}.
    tmfnodes = {'': mfs}

    # Callback for the manifest, used to collect linkrevs for filelog
    # revisions.
    # Returns the linkrev node (collected in lookupcl).
    def makelookupmflinknode(mfdir, nodes):
        if fastpathlinkrev:
            assert not mfdir
            return mfs.__getitem__

        def lookupmflinknode(x):
            """Callback for looking up the linknode for manifests.

            Returns the linkrev node for the specified manifest.

            SIDE EFFECT:

            1) fclnodes gets populated with the list of relevant
               file nodes if we're not using fastpathlinkrev
            2) When treemanifests are in use, collects treemanifest nodes
               to send

            Note that this means manifests must be completely sent to
            the client before you can trust the list of files and
            treemanifests to send.
            """
            clnode = nodes[x]
            mdata = mfl.get(mfdir, x).readfast(shallow=True)
            for p, n, fl in mdata.iterentries():
                if fl == 't': # subdirectory manifest
                    known = tmfnodes.setdefault(mfdir + p + '/', {})
                else:
                    known = fnodes.setdefault(mfdir + p, {})
                # Keep the changeset that comes first in changelog
                # emission order as the linknode of this entry.
                recorded = known.setdefault(n, clnode)
                if clrevorder[clnode] < clrevorder[recorded]:
                    known[n] = clnode
            return clnode
        return lookupmflinknode

    size = 0
    while tmfnodes:
        mfdir, nodes = tmfnodes.popitem()
        store = dirlog(mfdir)
        prunednodes = self._prune(store, nodes, commonrevs)
        if mfdir and not prunednodes:
            continue

        lookupfn = makelookupmflinknode(mfdir, nodes)

        if self._ellipses:
            revs = _sortnodesellipsis(store, prunednodes, cl,
                                      lookupfn)
        else:
            revs = _sortnodesnormal(store, prunednodes,
                                    self._reorder)

        for x in self._packmanifests(mfdir, store, revs, lookupfn):
            size += len(x)
            yield x
    self._verbosenote(_('%8.i (manifests)\n') % size)
    yield self._manifestsend
987
987
988 # The 'source' parameter is useful for extensions
988 # The 'source' parameter is useful for extensions
def generatefiles(self, changedfiles, linknodes, commonrevs, source,
                  mfdicts):
    """Emit the changegroup chunks for the file revisions to send.

    ``changedfiles`` is narrowed through ``self._filematcher`` and handed,
    together with the remaining arguments, to ``self._generatefiles()``,
    whose result is returned unchanged. ``source`` is only forwarded.

    For shallow packers (``self._isshallow``) the ``linknodes`` callback is
    wrapped first, so that it also reports file nodes which are present in
    the manifests listed in ``mfdicts`` (pairs of a manifest and the
    changelog node it is linked to) without having been introduced by them.
    """
    wanted = [f for f in changedfiles if self._filematcher(f)]

    if not self._isshallow:
        return self._generatefiles(wanted, linknodes, commonrevs, source)

    repo = self._repo
    commonctxs = [repo[c] for c in commonrevs]
    clrev = repo.changelog.rev
    baselinknodes = linknodes

    def shallowlinknodes(flog, fname):
        # Remember which filelog revision each common changeset uses for
        # this file; self._clrevtolocalrev is consulted later when
        # changelog revisions are translated into filelog revisions.
        for ctx in commonctxs:
            try:
                fnode = ctx.filenode(fname)
                self._clrevtolocalrev[ctx.rev()] = flog.rev(fnode)
            except error.ManifestLookupError:
                # Presumably the file is absent from this changeset's
                # manifest; there is nothing to record in that case.
                pass

        links = baselinknodes(flog, fname)
        if len(links) == len(mfdicts):
            return links

        for mf, lr in mfdicts:
            fnode = mf.get(fname, None)
            if fnode in links:
                # Keep whichever link node has the lowest changelog rev.
                links[fnode] = min(links[fnode], lr, key=clrev)
            elif fnode:
                links[fnode] = lr
        return links

    return self._generatefiles(wanted, shallowlinknodes, commonrevs, source)
1022
1022
def _generatefiles(self, changedfiles, linknodes, commonrevs, source):
    """Yield the changegroup chunks for every file in ``changedfiles``.

    Files are processed in sorted order. For each file, ``linknodes`` is
    called with the filelog and the file name and must return a mapping of
    file node to changelog link node. Nodes rejected by ``self._prune()``
    are dropped; a file with nothing left to send produces no output.
    Otherwise the file header is yielded, followed by the chunks from
    ``self.group()``.

    Raises ``error.Abort`` when the filelog for a file is empty or missing.
    ``source`` is not used here.
    """
    repo = self._repo
    changelog = repo.changelog
    progress = repo.ui.makeprogress(_('bundling'), unit=_('files'),
                                    total=len(changedfiles))
    for position, fname in enumerate(sorted(changedfiles), 1):
        flog = repo.file(fname)
        if not flog:
            raise error.Abort(_("empty or missing file data for %s") %
                              fname)

        linkmap = linknodes(flog, fname)

        # Resolves a file node to its changelog link node. The link nodes
        # were gathered by the caller (fastpath) or while the manifests
        # were being sent (slowpath).
        def lookuplinknode(fnode):
            return linkmap[fnode]

        tosend = self._prune(flog, linkmap, commonrevs)
        if not tosend:
            continue

        if self._ellipses:
            revs = _sortnodesellipsis(flog, tosend, changelog,
                                      lookuplinknode)
        else:
            revs = _sortnodesnormal(flog, tosend, self._reorder)

        progress.update(position, item=fname)
        header = _fileheader(fname)
        size = len(header)
        yield header
        for chunk in self.group(revs, flog, False, lookuplinknode):
            size += len(chunk)
            yield chunk
        self._verbosenote(_('%8.i %s\n') % (size, fname))
    progress.complete()
1058
1058
def _revisiondeltanarrow(self, store, ischangelog, rev, linkrev, linknode):
    """Build the ``revisiondelta`` for an ellipsis version of ``rev``.

    The parents of the emitted revision are taken from
    ``self._precomputedellipsis[linkrev]`` (changelog revision numbers) and
    translated into revisions of ``store``. The result carries the
    ``REVIDX_ELLIPSIS`` flag and is sent as a full text against the null
    node, never as a real delta.

    Raises ``error.Abort`` when a parent cannot be mapped to a revision of
    ``store``.
    """
    ellipsisparents = self._precomputedellipsis[linkrev]

    def tolocalrev(clrev):
        """Map a changelog revnum to a revnum of ``store``.

        The ellipsis DAG is expressed in changelog revision numbers, but
        parents of non-changelog revlogs must be given in terms of the
        revlog being sent.
        """
        if clrev == nullrev:
            return nullrev

        if ischangelog:
            return clrev

        # Breadth-first walk over the ellipsis-ized changelog, looking for
        # a changeset that the current revlog has a revision linked to.
        #
        # A flat manifest revlog should need a single step only, since
        # every relevant changelog entry is relevant to it. Filelogs and
        # tree manifest dirlogs were not touched by every changeset, so
        # some changelog nodes have to be skipped even after
        # ellipsis-izing.
        pending = [clrev]
        while pending:
            cur = pending.pop(0)
            if cur in self._clrevtolocalrev:
                return self._clrevtolocalrev[cur]

            if cur in self._fullclnodes:
                ancestors = self._repo.changelog.parentrevs(cur)
            elif cur in self._precomputedellipsis:
                ancestors = self._precomputedellipsis[cur]
            else:
                # An ellipsis whose parents lie outside the current bundle
                # (likely an incremental pull). The assumption is that the
                # revision of this same revlog linked to the requested
                # changeset can be used. That holds for the test suite but
                # has not been proven for every edge case.
                #
                # NOTE(review): the scan stops before revision 0, so a
                # match at revision 0 is never found -- confirm whether
                # that is intended.
                for candidate in pycompat.xrange(rev, 0, -1):
                    if store.linkrev(candidate) == clrev:
                        return candidate
                # No parent could be resolved for this node: abort the
                # changegroup construction.
                raise error.Abort(
                    'unable to resolve parent while packing %r %r'
                    ' for changeset %r' % (store.indexfile, rev, clrev))

            pending.extend(pp for pp in ancestors if pp != nullrev)

        return nullrev

    if not ellipsisparents or (
        store.parentrevs(rev) == (nullrev, nullrev)):
        p1 = p2 = nullrev
    elif len(ellipsisparents) == 1:
        [p1] = [tolocalrev(p) for p in ellipsisparents]
        p2 = nullrev
    else:
        p1, p2 = sorted(map(tolocalrev, ellipsisparents))

    node = store.node(rev)
    p1node = store.node(p1)
    p2node = store.node(p2)
    flags = store.flags(rev) | revlog.REVIDX_ELLIPSIS

    # TODO: try and actually send deltas for ellipsis data blocks
    fulltext = store.revision(node)
    header = mdiff.trivialdiffheader(len(fulltext))

    return revisiondelta(
        node=node,
        p1node=p1node,
        p2node=p2node,
        basenode=nullid,
        linknode=linknode,
        flags=flags,
        deltachunks=(header, fulltext),
    )
1150
1150
1151 def _deltaparentprev(store, rev, p1, p2, prev):
1151 def _deltaparentprev(store, rev, p1, p2, prev):
1152 """Resolve a delta parent to the previous revision.
1152 """Resolve a delta parent to the previous revision.
1153
1153
1154 Used for version 1 changegroups, which don't support generaldelta.
1154 Used for version 1 changegroups, which don't support generaldelta.
1155 """
1155 """
1156 return prev
1156 return prev
1157
1157
def _deltaparentgeneraldelta(store, rev, p1, p2, prev):
    """Pick the delta base for ``rev`` when general deltas are supported.

    Returns a revision number of ``store``, or ``nullrev`` to request a
    full snapshot.
    """
    storedbase = store.deltaparent(rev)

    if storedbase == nullrev:
        if not store.storedeltachains:
            # The revlog is configured to use full snapshots for a reason,
            # so stick to a full snapshot.
            return nullrev
        # Avoid sending a full revision just because the stored delta
        # parent is null; use prev instead. p1 is tempting, as it would
        # usually give a smaller delta, but computing a delta against p1
        # may require resolving its raw text, which could be expensive.
        # The revlog caches should already hold prev, meaning less CPU for
        # changegroup generation. There is likely room for a flag and/or
        # config option to control this behavior.
        candidate = prev
    elif storedbase in (p1, p2, prev):
        candidate = storedbase
    else:
        # Pick prev when we can't be sure the remote has the stored base.
        # This answer is returned without the candelta() check below.
        return prev

    if candidate != nullrev and not store.candelta(candidate, rev):
        return nullrev

    return candidate
1184
1184
1185 def _deltaparentellipses(store, rev, p1, p2, prev):
1185 def _deltaparentellipses(store, rev, p1, p2, prev):
1186 """Resolve a delta parent when in ellipses mode."""
1186 """Resolve a delta parent when in ellipses mode."""
1187 # TODO: send better deltas when in narrow mode.
1187 # TODO: send better deltas when in narrow mode.
1188 #
1188 #
1189 # changegroup.group() loops over revisions to send,
1189 # changegroup.group() loops over revisions to send,
1190 # including revisions we'll skip. What this means is that
1190 # including revisions we'll skip. What this means is that
1191 # `prev` will be a potentially useless delta base for all
1191 # `prev` will be a potentially useless delta base for all
1192 # ellipsis nodes, as the client likely won't have it. In
1192 # ellipsis nodes, as the client likely won't have it. In
1193 # the future we should do bookkeeping about which nodes
1193 # the future we should do bookkeeping about which nodes
1194 # have been sent to the client, and try to be
1194 # have been sent to the client, and try to be
1195 # significantly smarter about delta bases. This is
1195 # significantly smarter about delta bases. This is
1196 # slightly tricky because this same code has to work for
1196 # slightly tricky because this same code has to work for
1197 # all revlogs, and we don't have the linkrev/linknode here.
1197 # all revlogs, and we don't have the linkrev/linknode here.
1198 return p1
1198 return p1
1199
1199
def _makecg1packer(repo, filematcher, bundlecaps, ellipses=False,
                   shallow=False, ellipsisroots=None, fullnodes=None):
    """Return a ``cgpacker`` that produces version 01 changegroups.

    Deltas are always computed against the previous revision in the group
    (``_deltaparentprev``). All arguments are forwarded to ``cgpacker``.
    """
    def builddeltaheader(d):
        # The version 01 header has no delta base field: node, p1, p2,
        # linknode.
        return _CHANGEGROUPV1_DELTA_HEADER.pack(
            d.node, d.p1node, d.p2node, d.linknode)

    # NOTE(review): allowreorder=None presumably leaves the reordering
    # decision to the packer/configuration -- confirm against cgpacker.
    return cgpacker(
        repo,
        filematcher,
        b'01',
        deltaparentfn=_deltaparentprev,
        allowreorder=None,
        builddeltaheader=builddeltaheader,
        manifestsend=b'',
        bundlecaps=bundlecaps,
        ellipses=ellipses,
        shallow=shallow,
        ellipsisroots=ellipsisroots,
        fullnodes=fullnodes)
1215
1215
def _makecg2packer(repo, filematcher, bundlecaps, ellipses=False,
                   shallow=False, ellipsisroots=None, fullnodes=None):
    """Return a ``cgpacker`` that produces version 02 changegroups.

    Delta bases are chosen by ``_deltaparentgeneraldelta`` and named
    explicitly in each delta header. All arguments are forwarded to
    ``cgpacker``.
    """
    def builddeltaheader(d):
        # Version 02 header: node, p1, p2, delta base, linknode.
        return _CHANGEGROUPV2_DELTA_HEADER.pack(
            d.node, d.p1node, d.p2node, d.basenode, d.linknode)

    # Since generaldelta is directly supported by cg2, reordering
    # generally doesn't help, so it is disabled by default (treating
    # bundle.reorder=auto just like bundle.reorder=False).
    return cgpacker(
        repo,
        filematcher,
        b'02',
        deltaparentfn=_deltaparentgeneraldelta,
        allowreorder=False,
        builddeltaheader=builddeltaheader,
        manifestsend=b'',
        bundlecaps=bundlecaps,
        ellipses=ellipses,
        shallow=shallow,
        ellipsisroots=ellipsisroots,
        fullnodes=fullnodes)
1234
1234
def _makecg3packer(repo, filematcher, bundlecaps, ellipses=False,
                   shallow=False, ellipsisroots=None, fullnodes=None):
    """Return a ``cgpacker`` that produces version 03 changegroups.

    Delta bases are chosen by ``_deltaparentellipses`` when ``ellipses`` is
    set and by ``_deltaparentgeneraldelta`` otherwise. All arguments are
    forwarded to ``cgpacker``.
    """
    def builddeltaheader(d):
        # Version 03 header: node, p1, p2, delta base, linknode and the
        # revlog flags.
        return _CHANGEGROUPV3_DELTA_HEADER.pack(
            d.node, d.p1node, d.p2node, d.basenode, d.linknode, d.flags)

    if ellipses:
        deltaparentfn = _deltaparentellipses
    else:
        deltaparentfn = _deltaparentgeneraldelta

    # The manifest section ends with the chunk built by closechunk().
    return cgpacker(
        repo,
        filematcher,
        b'03',
        deltaparentfn=deltaparentfn,
        allowreorder=False,
        builddeltaheader=builddeltaheader,
        manifestsend=closechunk(),
        bundlecaps=bundlecaps,
        ellipses=ellipses,
        shallow=shallow,
        ellipsisroots=ellipsisroots,
        fullnodes=fullnodes)
1253
1253
# Maps a changegroup version string to a pair: the factory function that
# builds a packer for that version, and the matching unpacker class.
_packermap = {'01': (_makecg1packer, cg1unpacker),
             # cg2 adds support for exchanging generaldelta
             '02': (_makecg2packer, cg2unpacker),
             # cg3 adds support for exchanging revlog flags and treemanifests
             '03': (_makecg3packer, cg3unpacker),
}
1260
1260
def allsupportedversions(repo):
    """Return the set of changegroup versions known for ``repo``.

    Version '03' is included only if ``experimental.changegroup3`` or
    ``experimental.treemanifest`` is enabled, or the repository has the
    'treemanifest' requirement.
    """
    versions = set(_packermap)
    ui = repo.ui
    cg3enabled = (ui.configbool('experimental', 'changegroup3') or
                  ui.configbool('experimental', 'treemanifest') or
                  'treemanifest' in repo.requirements)
    if not cg3enabled:
        versions.discard('03')
    return versions
1268
1268
def supportedincomingversions(repo):
    """Return the changegroup versions that can be applied to ``repo``.

    This is currently everything ``allsupportedversions()`` reports.
    """
    versions = allsupportedversions(repo)
    return versions
1272
1272
def supportedoutgoingversions(repo):
    """Return the changegroup versions that can be created from ``repo``.

    Starts from ``allsupportedversions()`` and removes versions '01' and
    '02' when any repository requirement rules them out.
    """
    versions = allsupportedversions(repo)
    requirements = repo.requirements

    needscg3 = (
        # Versions 01 and 02 support only flat manifests and it's just too
        # expensive to convert between the flat manifest and tree manifest
        # on the fly. Since tree manifests are hashed differently, all of
        # history would have to be converted. Instead, we simply don't
        # even pretend to support versions 01 and 02.
        'treemanifest' in requirements or
        # Versions 01 and 02 don't support revlog flags, and we need to
        # support that for stripping and unbundling to work.
        repository.NARROW_REQUIREMENT in requirements or
        # Versions 01 and 02 don't support revlog flags, and we need to
        # mark LFS entries with REVIDX_EXTSTORED.
        LFS_REQUIREMENT in requirements)

    if needscg3:
        for unsupported in ('01', '02'):
            versions.discard(unsupported)

    return versions
1296
1296
def localversion(repo):
    """Return the best changegroup version for purely local bundles.

    That is the highest version ``repo`` can produce. It is meant for
    bundles that are only used locally, such as those written by strip and
    shelve, and for temporary bundles.
    """
    versions = supportedoutgoingversions(repo)
    return max(versions)
1301
1301
def safeversion(repo):
    """Return the lowest version clients of ``repo`` can be assumed to read.

    Version '01' is ruled out for generaldelta repositories, because every
    hg version that supports generaldelta also supports changegroup 02.
    """
    candidates = supportedoutgoingversions(repo)
    if 'generaldelta' in repo.requirements:
        candidates.discard('01')
    assert candidates
    return min(candidates)
1311
1311
def getbundler(version, repo, bundlecaps=None, filematcher=None,
               ellipses=False, shallow=False, ellipsisroots=None,
               fullnodes=None):
    """Return a packer producing changegroups of ``version`` for ``repo``.

    ``version`` must be one of ``supportedoutgoingversions(repo)``. When no
    ``filematcher`` is given, every file matches. The matcher that is
    finally used is intersected with the repository's narrow matcher.

    Raises ``error.ProgrammingError`` if version '01' is combined with a
    matcher that does not match everything, and ``error.Abort`` if
    ``ellipses`` is requested with version '01' or '02'.
    """
    assert version in supportedoutgoingversions(repo)

    matcher = filematcher
    if matcher is None:
        matcher = matchmod.alwaysmatcher(repo.root, '')

    if version == '01' and not matcher.always():
        raise error.ProgrammingError('version 01 changegroups do not support '
                                     'sparse file matchers')

    if ellipses and version in (b'01', b'02'):
        raise error.Abort(
            _('ellipsis nodes require at least cg3 on client and server, '
              'but negotiated version %s') % version)

    # Requested files could include files not in the local store. So
    # filter those out.
    matcher = matchmod.intersectmatchers(repo.narrowmatch(), matcher)

    makepacker = _packermap[version][0]
    return makepacker(repo, matcher, bundlecaps, ellipses=ellipses,
                      shallow=shallow, ellipsisroots=ellipsisroots,
                      fullnodes=fullnodes)
1338
1338
def getunbundler(version, fh, alg, extras=None):
    """Instantiate the unpacker registered for changegroup ``version``.

    ``fh``, ``alg`` and ``extras`` are passed through to the unpacker's
    constructor. An unknown ``version`` raises ``KeyError``.
    """
    unpackercls = _packermap[version][1]
    return unpackercls(fh, alg, extras=extras)
1341
1341
def _changegroupinfo(repo, nodes, source):
    """Report the changesets that are about to be bundled.

    The changeset count is printed in verbose mode or when ``source`` is
    'bundle'. In debug mode the hex form of every node is listed as well.
    """
    ui = repo.ui
    if ui.verbose or source == 'bundle':
        ui.status(_("%d changesets found\n") % len(nodes))

    if not ui.debugflag:
        return

    ui.debug("list of changesets:\n")
    for node in nodes:
        ui.debug("%s\n" % hex(node))
1349
1349
def makechangegroup(repo, outgoing, version, source, fastpath=False,
                    bundlecaps=None):
    """Return an unbundler reading the changegroup for ``outgoing``.

    The chunk stream from ``makestream()`` is wrapped in a
    ``util.chunkbuffer`` and passed to the unpacker for ``version``. The
    number of missing changesets is supplied as the 'clcount' extra.
    """
    stream = makestream(repo, outgoing, version, source,
                        fastpath=fastpath, bundlecaps=bundlecaps)
    buffered = util.chunkbuffer(stream)
    extras = {'clcount': len(outgoing.missing)}
    return getunbundler(version, buffered, None, extras)
1356
1356
def makestream(repo, outgoing, version, source, fastpath=False,
               bundlecaps=None, filematcher=None):
    """Return the chunk stream of the changegroup for ``outgoing``.

    A packer for ``version`` is obtained from ``getbundler()``. The
    'preoutgoing' hook is run (with ``throw=True``, so a failing hook
    aborts), the changesets are reported through ``_changegroupinfo()``,
    and the result of the packer's ``generate()`` is returned.

    ``outgoing`` is only read: its ``common``, ``missing`` and
    ``missingheads`` attributes are used and none of them is modified.
    """
    bundler = getbundler(version, repo, bundlecaps=bundlecaps,
                         filematcher=filematcher)

    repo = repo.unfiltered()
    commonrevs = outgoing.common
    csets = outgoing.missing
    # Sort a copy of the heads: ``outgoing`` belongs to the caller, and
    # sorting ``outgoing.missingheads`` in place would silently reorder a
    # list the caller may still be using.
    heads = sorted(outgoing.missingheads)
    # We go through the fast path if we get told to, or if all (unfiltered)
    # heads have been requested (since we then know that all linkrevs will
    # be pulled by the client).
    fastpathlinkrev = fastpath or (
        repo.filtername is None and heads == sorted(repo.heads()))

    repo.hook('preoutgoing', throw=True, source=source)
    _changegroupinfo(repo, csets, source)
    return bundler.generate(commonrevs, csets, fastpathlinkrev, source)
1376
1376
def _addchangegroupfiles(repo, source, revmap, trp, expectedfiles, needfiles):
    """Add the filelog groups read from ``source`` to ``repo``.

    ``needfiles`` maps a file name to the collection of file nodes that
    are expected for it. Nodes are removed from it as they arrive, and a
    file's entry is deleted once all of its nodes were received. Any node
    still listed afterwards must already exist in the local filelog.

    Returns a ``(revisions, files)`` tuple: the number of file revisions
    added and the number of filelog groups processed.

    Raises ``error.Abort`` on an empty group, a censored delta base, an
    unexpected file revision, or file data that is still missing.
    """
    ui = repo.ui
    addedrevs = 0
    filecount = 0
    progress = ui.makeprogress(_('files'), unit=_('files'),
                               total=expectedfiles)
    # Iteration stops as soon as filelogheader() returns an empty dict.
    for header in iter(source.filelogheader, {}):
        filecount += 1
        fname = header["filename"]
        ui.debug("adding %s revisions\n" % fname)
        progress.increment()
        flog = repo.file(fname)
        oldlen = len(flog)
        try:
            if not flog.addgroup(source.deltaiter(), revmap, trp):
                raise error.Abort(_("received file revlog group is empty"))
        except error.CensoredBaseError as e:
            raise error.Abort(_("received delta base is censored: %s") % e)
        addedrevs += len(flog) - oldlen

        if fname not in needfiles:
            continue

        # Every revision that was just added must be one we asked for.
        expected = needfiles[fname]
        for newrev in pycompat.xrange(oldlen, len(flog)):
            newnode = flog.node(newrev)
            if newnode not in expected:
                raise error.Abort(
                    _("received spurious file revlog entry"))
            expected.remove(newnode)
        if not expected:
            del needfiles[fname]
    progress.complete()

    # Whatever was not received has to be available locally already.
    for fname, expected in needfiles.iteritems():
        flog = repo.file(fname)
        for wanted in expected:
            try:
                flog.rev(wanted)
            except error.LookupError:
                raise error.Abort(
                    _('missing file data for %s:%s - run hg verify') %
                    (fname, hex(wanted)))

    return addedrevs, filecount
General Comments 0
You need to be logged in to leave comments. Login now