##// END OF EJS Templates
changegroup: make _revisiondeltanarrow() a standalone function...
Gregory Szorc -
r39040:e11d07cc default
parent child Browse files
Show More
@@ -1,1423 +1,1423 b''
1 # changegroup.py - Mercurial changegroup manipulation functions
1 # changegroup.py - Mercurial changegroup manipulation functions
2 #
2 #
3 # Copyright 2006 Matt Mackall <mpm@selenic.com>
3 # Copyright 2006 Matt Mackall <mpm@selenic.com>
4 #
4 #
5 # This software may be used and distributed according to the terms of the
5 # This software may be used and distributed according to the terms of the
6 # GNU General Public License version 2 or any later version.
6 # GNU General Public License version 2 or any later version.
7
7
8 from __future__ import absolute_import
8 from __future__ import absolute_import
9
9
10 import os
10 import os
11 import struct
11 import struct
12 import weakref
12 import weakref
13
13
14 from .i18n import _
14 from .i18n import _
15 from .node import (
15 from .node import (
16 hex,
16 hex,
17 nullid,
17 nullid,
18 nullrev,
18 nullrev,
19 short,
19 short,
20 )
20 )
21
21
22 from .thirdparty import (
22 from .thirdparty import (
23 attr,
23 attr,
24 )
24 )
25
25
26 from . import (
26 from . import (
27 dagutil,
27 dagutil,
28 error,
28 error,
29 manifest,
29 manifest,
30 match as matchmod,
30 match as matchmod,
31 mdiff,
31 mdiff,
32 phases,
32 phases,
33 pycompat,
33 pycompat,
34 repository,
34 repository,
35 revlog,
35 revlog,
36 util,
36 util,
37 )
37 )
38
38
39 from .utils import (
39 from .utils import (
40 stringutil,
40 stringutil,
41 )
41 )
42
42
43 _CHANGEGROUPV1_DELTA_HEADER = struct.Struct("20s20s20s20s")
43 _CHANGEGROUPV1_DELTA_HEADER = struct.Struct("20s20s20s20s")
44 _CHANGEGROUPV2_DELTA_HEADER = struct.Struct("20s20s20s20s20s")
44 _CHANGEGROUPV2_DELTA_HEADER = struct.Struct("20s20s20s20s20s")
45 _CHANGEGROUPV3_DELTA_HEADER = struct.Struct(">20s20s20s20s20sH")
45 _CHANGEGROUPV3_DELTA_HEADER = struct.Struct(">20s20s20s20s20sH")
46
46
47 LFS_REQUIREMENT = 'lfs'
47 LFS_REQUIREMENT = 'lfs'
48
48
49 readexactly = util.readexactly
49 readexactly = util.readexactly
50
50
51 def getchunk(stream):
51 def getchunk(stream):
52 """return the next chunk from stream as a string"""
52 """return the next chunk from stream as a string"""
53 d = readexactly(stream, 4)
53 d = readexactly(stream, 4)
54 l = struct.unpack(">l", d)[0]
54 l = struct.unpack(">l", d)[0]
55 if l <= 4:
55 if l <= 4:
56 if l:
56 if l:
57 raise error.Abort(_("invalid chunk length %d") % l)
57 raise error.Abort(_("invalid chunk length %d") % l)
58 return ""
58 return ""
59 return readexactly(stream, l - 4)
59 return readexactly(stream, l - 4)
60
60
61 def chunkheader(length):
61 def chunkheader(length):
62 """return a changegroup chunk header (string)"""
62 """return a changegroup chunk header (string)"""
63 return struct.pack(">l", length + 4)
63 return struct.pack(">l", length + 4)
64
64
65 def closechunk():
65 def closechunk():
66 """return a changegroup chunk header (string) for a zero-length chunk"""
66 """return a changegroup chunk header (string) for a zero-length chunk"""
67 return struct.pack(">l", 0)
67 return struct.pack(">l", 0)
68
68
69 def _fileheader(path):
69 def _fileheader(path):
70 """Obtain a changegroup chunk header for a named path."""
70 """Obtain a changegroup chunk header for a named path."""
71 return chunkheader(len(path)) + path
71 return chunkheader(len(path)) + path
72
72
73 def writechunks(ui, chunks, filename, vfs=None):
73 def writechunks(ui, chunks, filename, vfs=None):
74 """Write chunks to a file and return its filename.
74 """Write chunks to a file and return its filename.
75
75
76 The stream is assumed to be a bundle file.
76 The stream is assumed to be a bundle file.
77 Existing files will not be overwritten.
77 Existing files will not be overwritten.
78 If no filename is specified, a temporary file is created.
78 If no filename is specified, a temporary file is created.
79 """
79 """
80 fh = None
80 fh = None
81 cleanup = None
81 cleanup = None
82 try:
82 try:
83 if filename:
83 if filename:
84 if vfs:
84 if vfs:
85 fh = vfs.open(filename, "wb")
85 fh = vfs.open(filename, "wb")
86 else:
86 else:
87 # Increase default buffer size because default is usually
87 # Increase default buffer size because default is usually
88 # small (4k is common on Linux).
88 # small (4k is common on Linux).
89 fh = open(filename, "wb", 131072)
89 fh = open(filename, "wb", 131072)
90 else:
90 else:
91 fd, filename = pycompat.mkstemp(prefix="hg-bundle-", suffix=".hg")
91 fd, filename = pycompat.mkstemp(prefix="hg-bundle-", suffix=".hg")
92 fh = os.fdopen(fd, r"wb")
92 fh = os.fdopen(fd, r"wb")
93 cleanup = filename
93 cleanup = filename
94 for c in chunks:
94 for c in chunks:
95 fh.write(c)
95 fh.write(c)
96 cleanup = None
96 cleanup = None
97 return filename
97 return filename
98 finally:
98 finally:
99 if fh is not None:
99 if fh is not None:
100 fh.close()
100 fh.close()
101 if cleanup is not None:
101 if cleanup is not None:
102 if filename and vfs:
102 if filename and vfs:
103 vfs.unlink(cleanup)
103 vfs.unlink(cleanup)
104 else:
104 else:
105 os.unlink(cleanup)
105 os.unlink(cleanup)
106
106
107 class cg1unpacker(object):
107 class cg1unpacker(object):
108 """Unpacker for cg1 changegroup streams.
108 """Unpacker for cg1 changegroup streams.
109
109
110 A changegroup unpacker handles the framing of the revision data in
110 A changegroup unpacker handles the framing of the revision data in
111 the wire format. Most consumers will want to use the apply()
111 the wire format. Most consumers will want to use the apply()
112 method to add the changes from the changegroup to a repository.
112 method to add the changes from the changegroup to a repository.
113
113
114 If you're forwarding a changegroup unmodified to another consumer,
114 If you're forwarding a changegroup unmodified to another consumer,
115 use getchunks(), which returns an iterator of changegroup
115 use getchunks(), which returns an iterator of changegroup
116 chunks. This is mostly useful for cases where you need to know the
116 chunks. This is mostly useful for cases where you need to know the
117 data stream has ended by observing the end of the changegroup.
117 data stream has ended by observing the end of the changegroup.
118
118
119 deltachunk() is useful only if you're applying delta data. Most
119 deltachunk() is useful only if you're applying delta data. Most
120 consumers should prefer apply() instead.
120 consumers should prefer apply() instead.
121
121
122 A few other public methods exist. Those are used only for
122 A few other public methods exist. Those are used only for
123 bundlerepo and some debug commands - their use is discouraged.
123 bundlerepo and some debug commands - their use is discouraged.
124 """
124 """
125 deltaheader = _CHANGEGROUPV1_DELTA_HEADER
125 deltaheader = _CHANGEGROUPV1_DELTA_HEADER
126 deltaheadersize = deltaheader.size
126 deltaheadersize = deltaheader.size
127 version = '01'
127 version = '01'
128 _grouplistcount = 1 # One list of files after the manifests
128 _grouplistcount = 1 # One list of files after the manifests
129
129
130 def __init__(self, fh, alg, extras=None):
130 def __init__(self, fh, alg, extras=None):
131 if alg is None:
131 if alg is None:
132 alg = 'UN'
132 alg = 'UN'
133 if alg not in util.compengines.supportedbundletypes:
133 if alg not in util.compengines.supportedbundletypes:
134 raise error.Abort(_('unknown stream compression type: %s')
134 raise error.Abort(_('unknown stream compression type: %s')
135 % alg)
135 % alg)
136 if alg == 'BZ':
136 if alg == 'BZ':
137 alg = '_truncatedBZ'
137 alg = '_truncatedBZ'
138
138
139 compengine = util.compengines.forbundletype(alg)
139 compengine = util.compengines.forbundletype(alg)
140 self._stream = compengine.decompressorreader(fh)
140 self._stream = compengine.decompressorreader(fh)
141 self._type = alg
141 self._type = alg
142 self.extras = extras or {}
142 self.extras = extras or {}
143 self.callback = None
143 self.callback = None
144
144
145 # These methods (compressed, read, seek, tell) all appear to only
145 # These methods (compressed, read, seek, tell) all appear to only
146 # be used by bundlerepo, but it's a little hard to tell.
146 # be used by bundlerepo, but it's a little hard to tell.
147 def compressed(self):
147 def compressed(self):
148 return self._type is not None and self._type != 'UN'
148 return self._type is not None and self._type != 'UN'
149 def read(self, l):
149 def read(self, l):
150 return self._stream.read(l)
150 return self._stream.read(l)
151 def seek(self, pos):
151 def seek(self, pos):
152 return self._stream.seek(pos)
152 return self._stream.seek(pos)
153 def tell(self):
153 def tell(self):
154 return self._stream.tell()
154 return self._stream.tell()
155 def close(self):
155 def close(self):
156 return self._stream.close()
156 return self._stream.close()
157
157
158 def _chunklength(self):
158 def _chunklength(self):
159 d = readexactly(self._stream, 4)
159 d = readexactly(self._stream, 4)
160 l = struct.unpack(">l", d)[0]
160 l = struct.unpack(">l", d)[0]
161 if l <= 4:
161 if l <= 4:
162 if l:
162 if l:
163 raise error.Abort(_("invalid chunk length %d") % l)
163 raise error.Abort(_("invalid chunk length %d") % l)
164 return 0
164 return 0
165 if self.callback:
165 if self.callback:
166 self.callback()
166 self.callback()
167 return l - 4
167 return l - 4
168
168
169 def changelogheader(self):
169 def changelogheader(self):
170 """v10 does not have a changelog header chunk"""
170 """v10 does not have a changelog header chunk"""
171 return {}
171 return {}
172
172
173 def manifestheader(self):
173 def manifestheader(self):
174 """v10 does not have a manifest header chunk"""
174 """v10 does not have a manifest header chunk"""
175 return {}
175 return {}
176
176
177 def filelogheader(self):
177 def filelogheader(self):
178 """return the header of the filelogs chunk, v10 only has the filename"""
178 """return the header of the filelogs chunk, v10 only has the filename"""
179 l = self._chunklength()
179 l = self._chunklength()
180 if not l:
180 if not l:
181 return {}
181 return {}
182 fname = readexactly(self._stream, l)
182 fname = readexactly(self._stream, l)
183 return {'filename': fname}
183 return {'filename': fname}
184
184
185 def _deltaheader(self, headertuple, prevnode):
185 def _deltaheader(self, headertuple, prevnode):
186 node, p1, p2, cs = headertuple
186 node, p1, p2, cs = headertuple
187 if prevnode is None:
187 if prevnode is None:
188 deltabase = p1
188 deltabase = p1
189 else:
189 else:
190 deltabase = prevnode
190 deltabase = prevnode
191 flags = 0
191 flags = 0
192 return node, p1, p2, deltabase, cs, flags
192 return node, p1, p2, deltabase, cs, flags
193
193
194 def deltachunk(self, prevnode):
194 def deltachunk(self, prevnode):
195 l = self._chunklength()
195 l = self._chunklength()
196 if not l:
196 if not l:
197 return {}
197 return {}
198 headerdata = readexactly(self._stream, self.deltaheadersize)
198 headerdata = readexactly(self._stream, self.deltaheadersize)
199 header = self.deltaheader.unpack(headerdata)
199 header = self.deltaheader.unpack(headerdata)
200 delta = readexactly(self._stream, l - self.deltaheadersize)
200 delta = readexactly(self._stream, l - self.deltaheadersize)
201 node, p1, p2, deltabase, cs, flags = self._deltaheader(header, prevnode)
201 node, p1, p2, deltabase, cs, flags = self._deltaheader(header, prevnode)
202 return (node, p1, p2, cs, deltabase, delta, flags)
202 return (node, p1, p2, cs, deltabase, delta, flags)
203
203
204 def getchunks(self):
204 def getchunks(self):
205 """returns all the chunks contains in the bundle
205 """returns all the chunks contains in the bundle
206
206
207 Used when you need to forward the binary stream to a file or another
207 Used when you need to forward the binary stream to a file or another
208 network API. To do so, it parse the changegroup data, otherwise it will
208 network API. To do so, it parse the changegroup data, otherwise it will
209 block in case of sshrepo because it don't know the end of the stream.
209 block in case of sshrepo because it don't know the end of the stream.
210 """
210 """
211 # For changegroup 1 and 2, we expect 3 parts: changelog, manifestlog,
211 # For changegroup 1 and 2, we expect 3 parts: changelog, manifestlog,
212 # and a list of filelogs. For changegroup 3, we expect 4 parts:
212 # and a list of filelogs. For changegroup 3, we expect 4 parts:
213 # changelog, manifestlog, a list of tree manifestlogs, and a list of
213 # changelog, manifestlog, a list of tree manifestlogs, and a list of
214 # filelogs.
214 # filelogs.
215 #
215 #
216 # Changelog and manifestlog parts are terminated with empty chunks. The
216 # Changelog and manifestlog parts are terminated with empty chunks. The
217 # tree and file parts are a list of entry sections. Each entry section
217 # tree and file parts are a list of entry sections. Each entry section
218 # is a series of chunks terminating in an empty chunk. The list of these
218 # is a series of chunks terminating in an empty chunk. The list of these
219 # entry sections is terminated in yet another empty chunk, so we know
219 # entry sections is terminated in yet another empty chunk, so we know
220 # we've reached the end of the tree/file list when we reach an empty
220 # we've reached the end of the tree/file list when we reach an empty
221 # chunk that was proceeded by no non-empty chunks.
221 # chunk that was proceeded by no non-empty chunks.
222
222
223 parts = 0
223 parts = 0
224 while parts < 2 + self._grouplistcount:
224 while parts < 2 + self._grouplistcount:
225 noentries = True
225 noentries = True
226 while True:
226 while True:
227 chunk = getchunk(self)
227 chunk = getchunk(self)
228 if not chunk:
228 if not chunk:
229 # The first two empty chunks represent the end of the
229 # The first two empty chunks represent the end of the
230 # changelog and the manifestlog portions. The remaining
230 # changelog and the manifestlog portions. The remaining
231 # empty chunks represent either A) the end of individual
231 # empty chunks represent either A) the end of individual
232 # tree or file entries in the file list, or B) the end of
232 # tree or file entries in the file list, or B) the end of
233 # the entire list. It's the end of the entire list if there
233 # the entire list. It's the end of the entire list if there
234 # were no entries (i.e. noentries is True).
234 # were no entries (i.e. noentries is True).
235 if parts < 2:
235 if parts < 2:
236 parts += 1
236 parts += 1
237 elif noentries:
237 elif noentries:
238 parts += 1
238 parts += 1
239 break
239 break
240 noentries = False
240 noentries = False
241 yield chunkheader(len(chunk))
241 yield chunkheader(len(chunk))
242 pos = 0
242 pos = 0
243 while pos < len(chunk):
243 while pos < len(chunk):
244 next = pos + 2**20
244 next = pos + 2**20
245 yield chunk[pos:next]
245 yield chunk[pos:next]
246 pos = next
246 pos = next
247 yield closechunk()
247 yield closechunk()
248
248
249 def _unpackmanifests(self, repo, revmap, trp, prog):
249 def _unpackmanifests(self, repo, revmap, trp, prog):
250 self.callback = prog.increment
250 self.callback = prog.increment
251 # no need to check for empty manifest group here:
251 # no need to check for empty manifest group here:
252 # if the result of the merge of 1 and 2 is the same in 3 and 4,
252 # if the result of the merge of 1 and 2 is the same in 3 and 4,
253 # no new manifest will be created and the manifest group will
253 # no new manifest will be created and the manifest group will
254 # be empty during the pull
254 # be empty during the pull
255 self.manifestheader()
255 self.manifestheader()
256 deltas = self.deltaiter()
256 deltas = self.deltaiter()
257 repo.manifestlog.addgroup(deltas, revmap, trp)
257 repo.manifestlog.addgroup(deltas, revmap, trp)
258 prog.complete()
258 prog.complete()
259 self.callback = None
259 self.callback = None
260
260
261 def apply(self, repo, tr, srctype, url, targetphase=phases.draft,
261 def apply(self, repo, tr, srctype, url, targetphase=phases.draft,
262 expectedtotal=None):
262 expectedtotal=None):
263 """Add the changegroup returned by source.read() to this repo.
263 """Add the changegroup returned by source.read() to this repo.
264 srctype is a string like 'push', 'pull', or 'unbundle'. url is
264 srctype is a string like 'push', 'pull', or 'unbundle'. url is
265 the URL of the repo where this changegroup is coming from.
265 the URL of the repo where this changegroup is coming from.
266
266
267 Return an integer summarizing the change to this repo:
267 Return an integer summarizing the change to this repo:
268 - nothing changed or no source: 0
268 - nothing changed or no source: 0
269 - more heads than before: 1+added heads (2..n)
269 - more heads than before: 1+added heads (2..n)
270 - fewer heads than before: -1-removed heads (-2..-n)
270 - fewer heads than before: -1-removed heads (-2..-n)
271 - number of heads stays the same: 1
271 - number of heads stays the same: 1
272 """
272 """
273 repo = repo.unfiltered()
273 repo = repo.unfiltered()
274 def csmap(x):
274 def csmap(x):
275 repo.ui.debug("add changeset %s\n" % short(x))
275 repo.ui.debug("add changeset %s\n" % short(x))
276 return len(cl)
276 return len(cl)
277
277
278 def revmap(x):
278 def revmap(x):
279 return cl.rev(x)
279 return cl.rev(x)
280
280
281 changesets = files = revisions = 0
281 changesets = files = revisions = 0
282
282
283 try:
283 try:
284 # The transaction may already carry source information. In this
284 # The transaction may already carry source information. In this
285 # case we use the top level data. We overwrite the argument
285 # case we use the top level data. We overwrite the argument
286 # because we need to use the top level value (if they exist)
286 # because we need to use the top level value (if they exist)
287 # in this function.
287 # in this function.
288 srctype = tr.hookargs.setdefault('source', srctype)
288 srctype = tr.hookargs.setdefault('source', srctype)
289 url = tr.hookargs.setdefault('url', url)
289 url = tr.hookargs.setdefault('url', url)
290 repo.hook('prechangegroup',
290 repo.hook('prechangegroup',
291 throw=True, **pycompat.strkwargs(tr.hookargs))
291 throw=True, **pycompat.strkwargs(tr.hookargs))
292
292
293 # write changelog data to temp files so concurrent readers
293 # write changelog data to temp files so concurrent readers
294 # will not see an inconsistent view
294 # will not see an inconsistent view
295 cl = repo.changelog
295 cl = repo.changelog
296 cl.delayupdate(tr)
296 cl.delayupdate(tr)
297 oldheads = set(cl.heads())
297 oldheads = set(cl.heads())
298
298
299 trp = weakref.proxy(tr)
299 trp = weakref.proxy(tr)
300 # pull off the changeset group
300 # pull off the changeset group
301 repo.ui.status(_("adding changesets\n"))
301 repo.ui.status(_("adding changesets\n"))
302 clstart = len(cl)
302 clstart = len(cl)
303 progress = repo.ui.makeprogress(_('changesets'), unit=_('chunks'),
303 progress = repo.ui.makeprogress(_('changesets'), unit=_('chunks'),
304 total=expectedtotal)
304 total=expectedtotal)
305 self.callback = progress.increment
305 self.callback = progress.increment
306
306
307 efiles = set()
307 efiles = set()
308 def onchangelog(cl, node):
308 def onchangelog(cl, node):
309 efiles.update(cl.readfiles(node))
309 efiles.update(cl.readfiles(node))
310
310
311 self.changelogheader()
311 self.changelogheader()
312 deltas = self.deltaiter()
312 deltas = self.deltaiter()
313 cgnodes = cl.addgroup(deltas, csmap, trp, addrevisioncb=onchangelog)
313 cgnodes = cl.addgroup(deltas, csmap, trp, addrevisioncb=onchangelog)
314 efiles = len(efiles)
314 efiles = len(efiles)
315
315
316 if not cgnodes:
316 if not cgnodes:
317 repo.ui.develwarn('applied empty changegroup',
317 repo.ui.develwarn('applied empty changegroup',
318 config='warn-empty-changegroup')
318 config='warn-empty-changegroup')
319 clend = len(cl)
319 clend = len(cl)
320 changesets = clend - clstart
320 changesets = clend - clstart
321 progress.complete()
321 progress.complete()
322 self.callback = None
322 self.callback = None
323
323
324 # pull off the manifest group
324 # pull off the manifest group
325 repo.ui.status(_("adding manifests\n"))
325 repo.ui.status(_("adding manifests\n"))
326 # We know that we'll never have more manifests than we had
326 # We know that we'll never have more manifests than we had
327 # changesets.
327 # changesets.
328 progress = repo.ui.makeprogress(_('manifests'), unit=_('chunks'),
328 progress = repo.ui.makeprogress(_('manifests'), unit=_('chunks'),
329 total=changesets)
329 total=changesets)
330 self._unpackmanifests(repo, revmap, trp, progress)
330 self._unpackmanifests(repo, revmap, trp, progress)
331
331
332 needfiles = {}
332 needfiles = {}
333 if repo.ui.configbool('server', 'validate'):
333 if repo.ui.configbool('server', 'validate'):
334 cl = repo.changelog
334 cl = repo.changelog
335 ml = repo.manifestlog
335 ml = repo.manifestlog
336 # validate incoming csets have their manifests
336 # validate incoming csets have their manifests
337 for cset in pycompat.xrange(clstart, clend):
337 for cset in pycompat.xrange(clstart, clend):
338 mfnode = cl.changelogrevision(cset).manifest
338 mfnode = cl.changelogrevision(cset).manifest
339 mfest = ml[mfnode].readdelta()
339 mfest = ml[mfnode].readdelta()
340 # store file cgnodes we must see
340 # store file cgnodes we must see
341 for f, n in mfest.iteritems():
341 for f, n in mfest.iteritems():
342 needfiles.setdefault(f, set()).add(n)
342 needfiles.setdefault(f, set()).add(n)
343
343
344 # process the files
344 # process the files
345 repo.ui.status(_("adding file changes\n"))
345 repo.ui.status(_("adding file changes\n"))
346 newrevs, newfiles = _addchangegroupfiles(
346 newrevs, newfiles = _addchangegroupfiles(
347 repo, self, revmap, trp, efiles, needfiles)
347 repo, self, revmap, trp, efiles, needfiles)
348 revisions += newrevs
348 revisions += newrevs
349 files += newfiles
349 files += newfiles
350
350
351 deltaheads = 0
351 deltaheads = 0
352 if oldheads:
352 if oldheads:
353 heads = cl.heads()
353 heads = cl.heads()
354 deltaheads = len(heads) - len(oldheads)
354 deltaheads = len(heads) - len(oldheads)
355 for h in heads:
355 for h in heads:
356 if h not in oldheads and repo[h].closesbranch():
356 if h not in oldheads and repo[h].closesbranch():
357 deltaheads -= 1
357 deltaheads -= 1
358 htext = ""
358 htext = ""
359 if deltaheads:
359 if deltaheads:
360 htext = _(" (%+d heads)") % deltaheads
360 htext = _(" (%+d heads)") % deltaheads
361
361
362 repo.ui.status(_("added %d changesets"
362 repo.ui.status(_("added %d changesets"
363 " with %d changes to %d files%s\n")
363 " with %d changes to %d files%s\n")
364 % (changesets, revisions, files, htext))
364 % (changesets, revisions, files, htext))
365 repo.invalidatevolatilesets()
365 repo.invalidatevolatilesets()
366
366
367 if changesets > 0:
367 if changesets > 0:
368 if 'node' not in tr.hookargs:
368 if 'node' not in tr.hookargs:
369 tr.hookargs['node'] = hex(cl.node(clstart))
369 tr.hookargs['node'] = hex(cl.node(clstart))
370 tr.hookargs['node_last'] = hex(cl.node(clend - 1))
370 tr.hookargs['node_last'] = hex(cl.node(clend - 1))
371 hookargs = dict(tr.hookargs)
371 hookargs = dict(tr.hookargs)
372 else:
372 else:
373 hookargs = dict(tr.hookargs)
373 hookargs = dict(tr.hookargs)
374 hookargs['node'] = hex(cl.node(clstart))
374 hookargs['node'] = hex(cl.node(clstart))
375 hookargs['node_last'] = hex(cl.node(clend - 1))
375 hookargs['node_last'] = hex(cl.node(clend - 1))
376 repo.hook('pretxnchangegroup',
376 repo.hook('pretxnchangegroup',
377 throw=True, **pycompat.strkwargs(hookargs))
377 throw=True, **pycompat.strkwargs(hookargs))
378
378
379 added = [cl.node(r) for r in pycompat.xrange(clstart, clend)]
379 added = [cl.node(r) for r in pycompat.xrange(clstart, clend)]
380 phaseall = None
380 phaseall = None
381 if srctype in ('push', 'serve'):
381 if srctype in ('push', 'serve'):
382 # Old servers can not push the boundary themselves.
382 # Old servers can not push the boundary themselves.
383 # New servers won't push the boundary if changeset already
383 # New servers won't push the boundary if changeset already
384 # exists locally as secret
384 # exists locally as secret
385 #
385 #
386 # We should not use added here but the list of all change in
386 # We should not use added here but the list of all change in
387 # the bundle
387 # the bundle
388 if repo.publishing():
388 if repo.publishing():
389 targetphase = phaseall = phases.public
389 targetphase = phaseall = phases.public
390 else:
390 else:
391 # closer target phase computation
391 # closer target phase computation
392
392
393 # Those changesets have been pushed from the
393 # Those changesets have been pushed from the
394 # outside, their phases are going to be pushed
394 # outside, their phases are going to be pushed
395 # alongside. Therefor `targetphase` is
395 # alongside. Therefor `targetphase` is
396 # ignored.
396 # ignored.
397 targetphase = phaseall = phases.draft
397 targetphase = phaseall = phases.draft
398 if added:
398 if added:
399 phases.registernew(repo, tr, targetphase, added)
399 phases.registernew(repo, tr, targetphase, added)
400 if phaseall is not None:
400 if phaseall is not None:
401 phases.advanceboundary(repo, tr, phaseall, cgnodes)
401 phases.advanceboundary(repo, tr, phaseall, cgnodes)
402
402
403 if changesets > 0:
403 if changesets > 0:
404
404
405 def runhooks():
405 def runhooks():
406 # These hooks run when the lock releases, not when the
406 # These hooks run when the lock releases, not when the
407 # transaction closes. So it's possible for the changelog
407 # transaction closes. So it's possible for the changelog
408 # to have changed since we last saw it.
408 # to have changed since we last saw it.
409 if clstart >= len(repo):
409 if clstart >= len(repo):
410 return
410 return
411
411
412 repo.hook("changegroup", **pycompat.strkwargs(hookargs))
412 repo.hook("changegroup", **pycompat.strkwargs(hookargs))
413
413
414 for n in added:
414 for n in added:
415 args = hookargs.copy()
415 args = hookargs.copy()
416 args['node'] = hex(n)
416 args['node'] = hex(n)
417 del args['node_last']
417 del args['node_last']
418 repo.hook("incoming", **pycompat.strkwargs(args))
418 repo.hook("incoming", **pycompat.strkwargs(args))
419
419
420 newheads = [h for h in repo.heads()
420 newheads = [h for h in repo.heads()
421 if h not in oldheads]
421 if h not in oldheads]
422 repo.ui.log("incoming",
422 repo.ui.log("incoming",
423 "%d incoming changes - new heads: %s\n",
423 "%d incoming changes - new heads: %s\n",
424 len(added),
424 len(added),
425 ', '.join([hex(c[:6]) for c in newheads]))
425 ', '.join([hex(c[:6]) for c in newheads]))
426
426
427 tr.addpostclose('changegroup-runhooks-%020i' % clstart,
427 tr.addpostclose('changegroup-runhooks-%020i' % clstart,
428 lambda tr: repo._afterlock(runhooks))
428 lambda tr: repo._afterlock(runhooks))
429 finally:
429 finally:
430 repo.ui.flush()
430 repo.ui.flush()
431 # never return 0 here:
431 # never return 0 here:
432 if deltaheads < 0:
432 if deltaheads < 0:
433 ret = deltaheads - 1
433 ret = deltaheads - 1
434 else:
434 else:
435 ret = deltaheads + 1
435 ret = deltaheads + 1
436 return ret
436 return ret
437
437
438 def deltaiter(self):
438 def deltaiter(self):
439 """
439 """
440 returns an iterator of the deltas in this changegroup
440 returns an iterator of the deltas in this changegroup
441
441
442 Useful for passing to the underlying storage system to be stored.
442 Useful for passing to the underlying storage system to be stored.
443 """
443 """
444 chain = None
444 chain = None
445 for chunkdata in iter(lambda: self.deltachunk(chain), {}):
445 for chunkdata in iter(lambda: self.deltachunk(chain), {}):
446 # Chunkdata: (node, p1, p2, cs, deltabase, delta, flags)
446 # Chunkdata: (node, p1, p2, cs, deltabase, delta, flags)
447 yield chunkdata
447 yield chunkdata
448 chain = chunkdata[0]
448 chain = chunkdata[0]
449
449
450 class cg2unpacker(cg1unpacker):
450 class cg2unpacker(cg1unpacker):
451 """Unpacker for cg2 streams.
451 """Unpacker for cg2 streams.
452
452
453 cg2 streams add support for generaldelta, so the delta header
453 cg2 streams add support for generaldelta, so the delta header
454 format is slightly different. All other features about the data
454 format is slightly different. All other features about the data
455 remain the same.
455 remain the same.
456 """
456 """
457 deltaheader = _CHANGEGROUPV2_DELTA_HEADER
457 deltaheader = _CHANGEGROUPV2_DELTA_HEADER
458 deltaheadersize = deltaheader.size
458 deltaheadersize = deltaheader.size
459 version = '02'
459 version = '02'
460
460
461 def _deltaheader(self, headertuple, prevnode):
461 def _deltaheader(self, headertuple, prevnode):
462 node, p1, p2, deltabase, cs = headertuple
462 node, p1, p2, deltabase, cs = headertuple
463 flags = 0
463 flags = 0
464 return node, p1, p2, deltabase, cs, flags
464 return node, p1, p2, deltabase, cs, flags
465
465
466 class cg3unpacker(cg2unpacker):
466 class cg3unpacker(cg2unpacker):
467 """Unpacker for cg3 streams.
467 """Unpacker for cg3 streams.
468
468
469 cg3 streams add support for exchanging treemanifests and revlog
469 cg3 streams add support for exchanging treemanifests and revlog
470 flags. It adds the revlog flags to the delta header and an empty chunk
470 flags. It adds the revlog flags to the delta header and an empty chunk
471 separating manifests and files.
471 separating manifests and files.
472 """
472 """
473 deltaheader = _CHANGEGROUPV3_DELTA_HEADER
473 deltaheader = _CHANGEGROUPV3_DELTA_HEADER
474 deltaheadersize = deltaheader.size
474 deltaheadersize = deltaheader.size
475 version = '03'
475 version = '03'
476 _grouplistcount = 2 # One list of manifests and one list of files
476 _grouplistcount = 2 # One list of manifests and one list of files
477
477
478 def _deltaheader(self, headertuple, prevnode):
478 def _deltaheader(self, headertuple, prevnode):
479 node, p1, p2, deltabase, cs, flags = headertuple
479 node, p1, p2, deltabase, cs, flags = headertuple
480 return node, p1, p2, deltabase, cs, flags
480 return node, p1, p2, deltabase, cs, flags
481
481
482 def _unpackmanifests(self, repo, revmap, trp, prog):
482 def _unpackmanifests(self, repo, revmap, trp, prog):
483 super(cg3unpacker, self)._unpackmanifests(repo, revmap, trp, prog)
483 super(cg3unpacker, self)._unpackmanifests(repo, revmap, trp, prog)
484 for chunkdata in iter(self.filelogheader, {}):
484 for chunkdata in iter(self.filelogheader, {}):
485 # If we get here, there are directory manifests in the changegroup
485 # If we get here, there are directory manifests in the changegroup
486 d = chunkdata["filename"]
486 d = chunkdata["filename"]
487 repo.ui.debug("adding %s revisions\n" % d)
487 repo.ui.debug("adding %s revisions\n" % d)
488 dirlog = repo.manifestlog._revlog.dirlog(d)
488 dirlog = repo.manifestlog._revlog.dirlog(d)
489 deltas = self.deltaiter()
489 deltas = self.deltaiter()
490 if not dirlog.addgroup(deltas, revmap, trp):
490 if not dirlog.addgroup(deltas, revmap, trp):
491 raise error.Abort(_("received dir revlog group is empty"))
491 raise error.Abort(_("received dir revlog group is empty"))
492
492
493 class headerlessfixup(object):
493 class headerlessfixup(object):
494 def __init__(self, fh, h):
494 def __init__(self, fh, h):
495 self._h = h
495 self._h = h
496 self._fh = fh
496 self._fh = fh
497 def read(self, n):
497 def read(self, n):
498 if self._h:
498 if self._h:
499 d, self._h = self._h[:n], self._h[n:]
499 d, self._h = self._h[:n], self._h[n:]
500 if len(d) < n:
500 if len(d) < n:
501 d += readexactly(self._fh, n - len(d))
501 d += readexactly(self._fh, n - len(d))
502 return d
502 return d
503 return readexactly(self._fh, n)
503 return readexactly(self._fh, n)
504
504
505 @attr.s(slots=True, frozen=True)
505 @attr.s(slots=True, frozen=True)
506 class revisiondelta(object):
506 class revisiondelta(object):
507 """Describes a delta entry in a changegroup.
507 """Describes a delta entry in a changegroup.
508
508
509 Captured data is sufficient to serialize the delta into multiple
509 Captured data is sufficient to serialize the delta into multiple
510 formats.
510 formats.
511 """
511 """
512 # 20 byte node of this revision.
512 # 20 byte node of this revision.
513 node = attr.ib()
513 node = attr.ib()
514 # 20 byte nodes of parent revisions.
514 # 20 byte nodes of parent revisions.
515 p1node = attr.ib()
515 p1node = attr.ib()
516 p2node = attr.ib()
516 p2node = attr.ib()
517 # 20 byte node of node this delta is against.
517 # 20 byte node of node this delta is against.
518 basenode = attr.ib()
518 basenode = attr.ib()
519 # 20 byte node of changeset revision this delta is associated with.
519 # 20 byte node of changeset revision this delta is associated with.
520 linknode = attr.ib()
520 linknode = attr.ib()
521 # 2 bytes of flags to apply to revision data.
521 # 2 bytes of flags to apply to revision data.
522 flags = attr.ib()
522 flags = attr.ib()
523 # Iterable of chunks holding raw delta data.
523 # Iterable of chunks holding raw delta data.
524 deltachunks = attr.ib()
524 deltachunks = attr.ib()
525
525
526 def _sortnodesnormal(store, nodes, reorder):
526 def _sortnodesnormal(store, nodes, reorder):
527 """Sort nodes for changegroup generation and turn into revnums."""
527 """Sort nodes for changegroup generation and turn into revnums."""
528 # for generaldelta revlogs, we linearize the revs; this will both be
528 # for generaldelta revlogs, we linearize the revs; this will both be
529 # much quicker and generate a much smaller bundle
529 # much quicker and generate a much smaller bundle
530 if (store._generaldelta and reorder is None) or reorder:
530 if (store._generaldelta and reorder is None) or reorder:
531 dag = dagutil.revlogdag(store)
531 dag = dagutil.revlogdag(store)
532 return dag.linearize(set(store.rev(n) for n in nodes))
532 return dag.linearize(set(store.rev(n) for n in nodes))
533 else:
533 else:
534 return sorted([store.rev(n) for n in nodes])
534 return sorted([store.rev(n) for n in nodes])
535
535
536 def _sortnodesellipsis(store, nodes, cl, lookup):
536 def _sortnodesellipsis(store, nodes, cl, lookup):
537 """Sort nodes for changegroup generation and turn into revnums."""
537 """Sort nodes for changegroup generation and turn into revnums."""
538 # Ellipses serving mode.
538 # Ellipses serving mode.
539 #
539 #
540 # In a perfect world, we'd generate better ellipsis-ified graphs
540 # In a perfect world, we'd generate better ellipsis-ified graphs
541 # for non-changelog revlogs. In practice, we haven't started doing
541 # for non-changelog revlogs. In practice, we haven't started doing
542 # that yet, so the resulting DAGs for the manifestlog and filelogs
542 # that yet, so the resulting DAGs for the manifestlog and filelogs
543 # are actually full of bogus parentage on all the ellipsis
543 # are actually full of bogus parentage on all the ellipsis
544 # nodes. This has the side effect that, while the contents are
544 # nodes. This has the side effect that, while the contents are
545 # correct, the individual DAGs might be completely out of whack in
545 # correct, the individual DAGs might be completely out of whack in
546 # a case like 882681bc3166 and its ancestors (back about 10
546 # a case like 882681bc3166 and its ancestors (back about 10
547 # revisions or so) in the main hg repo.
547 # revisions or so) in the main hg repo.
548 #
548 #
549 # The one invariant we *know* holds is that the new (potentially
549 # The one invariant we *know* holds is that the new (potentially
550 # bogus) DAG shape will be valid if we order the nodes in the
550 # bogus) DAG shape will be valid if we order the nodes in the
551 # order that they're introduced in dramatis personae by the
551 # order that they're introduced in dramatis personae by the
552 # changelog, so what we do is we sort the non-changelog histories
552 # changelog, so what we do is we sort the non-changelog histories
553 # by the order in which they are used by the changelog.
553 # by the order in which they are used by the changelog.
554 key = lambda n: cl.rev(lookup(n))
554 key = lambda n: cl.rev(lookup(n))
555 return [store.rev(n) for n in sorted(nodes, key=key)]
555 return [store.rev(n) for n in sorted(nodes, key=key)]
556
556
557 def _revisiondeltanormal(store, rev, prev, linknode, deltaparentfn):
557 def _revisiondeltanormal(store, rev, prev, linknode, deltaparentfn):
558 """Construct a revision delta for non-ellipses changegroup generation."""
558 """Construct a revision delta for non-ellipses changegroup generation."""
559 node = store.node(rev)
559 node = store.node(rev)
560 p1, p2 = store.parentrevs(rev)
560 p1, p2 = store.parentrevs(rev)
561 base = deltaparentfn(store, rev, p1, p2, prev)
561 base = deltaparentfn(store, rev, p1, p2, prev)
562
562
563 prefix = ''
563 prefix = ''
564 if store.iscensored(base) or store.iscensored(rev):
564 if store.iscensored(base) or store.iscensored(rev):
565 try:
565 try:
566 delta = store.revision(node, raw=True)
566 delta = store.revision(node, raw=True)
567 except error.CensoredNodeError as e:
567 except error.CensoredNodeError as e:
568 delta = e.tombstone
568 delta = e.tombstone
569 if base == nullrev:
569 if base == nullrev:
570 prefix = mdiff.trivialdiffheader(len(delta))
570 prefix = mdiff.trivialdiffheader(len(delta))
571 else:
571 else:
572 baselen = store.rawsize(base)
572 baselen = store.rawsize(base)
573 prefix = mdiff.replacediffheader(baselen, len(delta))
573 prefix = mdiff.replacediffheader(baselen, len(delta))
574 elif base == nullrev:
574 elif base == nullrev:
575 delta = store.revision(node, raw=True)
575 delta = store.revision(node, raw=True)
576 prefix = mdiff.trivialdiffheader(len(delta))
576 prefix = mdiff.trivialdiffheader(len(delta))
577 else:
577 else:
578 delta = store.revdiff(base, rev)
578 delta = store.revdiff(base, rev)
579 p1n, p2n = store.parents(node)
579 p1n, p2n = store.parents(node)
580
580
581 return revisiondelta(
581 return revisiondelta(
582 node=node,
582 node=node,
583 p1node=p1n,
583 p1node=p1n,
584 p2node=p2n,
584 p2node=p2n,
585 basenode=store.node(base),
585 basenode=store.node(base),
586 linknode=linknode,
586 linknode=linknode,
587 flags=store.flags(rev),
587 flags=store.flags(rev),
588 deltachunks=(prefix, delta),
588 deltachunks=(prefix, delta),
589 )
589 )
590
590
591 def _revisiondeltanarrow(cl, store, ischangelog, rev, linkrev,
592 linknode, clrevtolocalrev, fullclnodes,
593 precomputedellipsis):
594 linkparents = precomputedellipsis[linkrev]
595 def local(clrev):
596 """Turn a changelog revnum into a local revnum.
597
598 The ellipsis dag is stored as revnums on the changelog,
599 but when we're producing ellipsis entries for
600 non-changelog revlogs, we need to turn those numbers into
601 something local. This does that for us, and during the
602 changelog sending phase will also expand the stored
603 mappings as needed.
604 """
605 if clrev == nullrev:
606 return nullrev
607
608 if ischangelog:
609 return clrev
610
611 # Walk the ellipsis-ized changelog breadth-first looking for a
612 # change that has been linked from the current revlog.
613 #
614 # For a flat manifest revlog only a single step should be necessary
615 # as all relevant changelog entries are relevant to the flat
616 # manifest.
617 #
618 # For a filelog or tree manifest dirlog however not every changelog
619 # entry will have been relevant, so we need to skip some changelog
620 # nodes even after ellipsis-izing.
621 walk = [clrev]
622 while walk:
623 p = walk[0]
624 walk = walk[1:]
625 if p in clrevtolocalrev:
626 return clrevtolocalrev[p]
627 elif p in fullclnodes:
628 walk.extend([pp for pp in cl.parentrevs(p)
629 if pp != nullrev])
630 elif p in precomputedellipsis:
631 walk.extend([pp for pp in precomputedellipsis[p]
632 if pp != nullrev])
633 else:
634 # In this case, we've got an ellipsis with parents
635 # outside the current bundle (likely an
636 # incremental pull). We "know" that we can use the
637 # value of this same revlog at whatever revision
638 # is pointed to by linknode. "Know" is in scare
639 # quotes because I haven't done enough examination
640 # of edge cases to convince myself this is really
641 # a fact - it works for all the (admittedly
642 # thorough) cases in our testsuite, but I would be
643 # somewhat unsurprised to find a case in the wild
644 # where this breaks down a bit. That said, I don't
645 # know if it would hurt anything.
646 for i in pycompat.xrange(rev, 0, -1):
647 if store.linkrev(i) == clrev:
648 return i
649 # We failed to resolve a parent for this node, so
650 # we crash the changegroup construction.
651 raise error.Abort(
652 'unable to resolve parent while packing %r %r'
653 ' for changeset %r' % (store.indexfile, rev, clrev))
654
655 return nullrev
656
657 if not linkparents or (
658 store.parentrevs(rev) == (nullrev, nullrev)):
659 p1, p2 = nullrev, nullrev
660 elif len(linkparents) == 1:
661 p1, = sorted(local(p) for p in linkparents)
662 p2 = nullrev
663 else:
664 p1, p2 = sorted(local(p) for p in linkparents)
665
666 n = store.node(rev)
667 p1n, p2n = store.node(p1), store.node(p2)
668 flags = store.flags(rev)
669 flags |= revlog.REVIDX_ELLIPSIS
670
671 # TODO: try and actually send deltas for ellipsis data blocks
672 data = store.revision(n)
673 diffheader = mdiff.trivialdiffheader(len(data))
674
675 return revisiondelta(
676 node=n,
677 p1node=p1n,
678 p2node=p2n,
679 basenode=nullid,
680 linknode=linknode,
681 flags=flags,
682 deltachunks=(diffheader, data),
683 )
684
591 class cgpacker(object):
685 class cgpacker(object):
592 def __init__(self, repo, filematcher, version, allowreorder,
686 def __init__(self, repo, filematcher, version, allowreorder,
593 deltaparentfn, builddeltaheader, manifestsend,
687 deltaparentfn, builddeltaheader, manifestsend,
594 bundlecaps=None, ellipses=False,
688 bundlecaps=None, ellipses=False,
595 shallow=False, ellipsisroots=None, fullnodes=None):
689 shallow=False, ellipsisroots=None, fullnodes=None):
596 """Given a source repo, construct a bundler.
690 """Given a source repo, construct a bundler.
597
691
598 filematcher is a matcher that matches on files to include in the
692 filematcher is a matcher that matches on files to include in the
599 changegroup. Used to facilitate sparse changegroups.
693 changegroup. Used to facilitate sparse changegroups.
600
694
601 allowreorder controls whether reordering of revisions is allowed.
695 allowreorder controls whether reordering of revisions is allowed.
602 This value is used when ``bundle.reorder`` is ``auto`` or isn't
696 This value is used when ``bundle.reorder`` is ``auto`` or isn't
603 set.
697 set.
604
698
605 deltaparentfn is a callable that resolves the delta parent for
699 deltaparentfn is a callable that resolves the delta parent for
606 a specific revision.
700 a specific revision.
607
701
608 builddeltaheader is a callable that constructs the header for a group
702 builddeltaheader is a callable that constructs the header for a group
609 delta.
703 delta.
610
704
611 manifestsend is a chunk to send after manifests have been fully emitted.
705 manifestsend is a chunk to send after manifests have been fully emitted.
612
706
613 ellipses indicates whether ellipsis serving mode is enabled.
707 ellipses indicates whether ellipsis serving mode is enabled.
614
708
615 bundlecaps is optional and can be used to specify the set of
709 bundlecaps is optional and can be used to specify the set of
616 capabilities which can be used to build the bundle. While bundlecaps is
710 capabilities which can be used to build the bundle. While bundlecaps is
617 unused in core Mercurial, extensions rely on this feature to communicate
711 unused in core Mercurial, extensions rely on this feature to communicate
618 capabilities to customize the changegroup packer.
712 capabilities to customize the changegroup packer.
619
713
620 shallow indicates whether shallow data might be sent. The packer may
714 shallow indicates whether shallow data might be sent. The packer may
621 need to pack file contents not introduced by the changes being packed.
715 need to pack file contents not introduced by the changes being packed.
622
716
623 fullnodes is the set of changelog nodes which should not be ellipsis
717 fullnodes is the set of changelog nodes which should not be ellipsis
624 nodes. We store this rather than the set of nodes that should be
718 nodes. We store this rather than the set of nodes that should be
625 ellipsis because for very large histories we expect this to be
719 ellipsis because for very large histories we expect this to be
626 significantly smaller.
720 significantly smaller.
627 """
721 """
628 assert filematcher
722 assert filematcher
629 self._filematcher = filematcher
723 self._filematcher = filematcher
630
724
631 self.version = version
725 self.version = version
632 self._deltaparentfn = deltaparentfn
726 self._deltaparentfn = deltaparentfn
633 self._builddeltaheader = builddeltaheader
727 self._builddeltaheader = builddeltaheader
634 self._manifestsend = manifestsend
728 self._manifestsend = manifestsend
635 self._ellipses = ellipses
729 self._ellipses = ellipses
636
730
637 # Set of capabilities we can use to build the bundle.
731 # Set of capabilities we can use to build the bundle.
638 if bundlecaps is None:
732 if bundlecaps is None:
639 bundlecaps = set()
733 bundlecaps = set()
640 self._bundlecaps = bundlecaps
734 self._bundlecaps = bundlecaps
641 self._isshallow = shallow
735 self._isshallow = shallow
642 self._fullclnodes = fullnodes
736 self._fullclnodes = fullnodes
643
737
644 # Maps ellipsis revs to their roots at the changelog level.
738 # Maps ellipsis revs to their roots at the changelog level.
645 self._precomputedellipsis = ellipsisroots
739 self._precomputedellipsis = ellipsisroots
646
740
647 # experimental config: bundle.reorder
741 # experimental config: bundle.reorder
648 reorder = repo.ui.config('bundle', 'reorder')
742 reorder = repo.ui.config('bundle', 'reorder')
649 if reorder == 'auto':
743 if reorder == 'auto':
650 self._reorder = allowreorder
744 self._reorder = allowreorder
651 else:
745 else:
652 self._reorder = stringutil.parsebool(reorder)
746 self._reorder = stringutil.parsebool(reorder)
653
747
654 self._repo = repo
748 self._repo = repo
655
749
656 if self._repo.ui.verbose and not self._repo.ui.debugflag:
750 if self._repo.ui.verbose and not self._repo.ui.debugflag:
657 self._verbosenote = self._repo.ui.note
751 self._verbosenote = self._repo.ui.note
658 else:
752 else:
659 self._verbosenote = lambda s: None
753 self._verbosenote = lambda s: None
660
754
661 def group(self, revs, store, ischangelog, lookup, units=None,
755 def group(self, revs, store, ischangelog, lookup, units=None,
662 clrevtolocalrev=None):
756 clrevtolocalrev=None):
663 """Calculate a delta group, yielding a sequence of changegroup chunks
757 """Calculate a delta group, yielding a sequence of changegroup chunks
664 (strings).
758 (strings).
665
759
666 Given a list of changeset revs, return a set of deltas and
760 Given a list of changeset revs, return a set of deltas and
667 metadata corresponding to nodes. The first delta is
761 metadata corresponding to nodes. The first delta is
668 first parent(nodelist[0]) -> nodelist[0], the receiver is
762 first parent(nodelist[0]) -> nodelist[0], the receiver is
669 guaranteed to have this parent as it has all history before
763 guaranteed to have this parent as it has all history before
670 these changesets. In the case firstparent is nullrev the
764 these changesets. In the case firstparent is nullrev the
671 changegroup starts with a full revision.
765 changegroup starts with a full revision.
672
766
673 If units is not None, progress detail will be generated, units specifies
767 If units is not None, progress detail will be generated, units specifies
674 the type of revlog that is touched (changelog, manifest, etc.).
768 the type of revlog that is touched (changelog, manifest, etc.).
675 """
769 """
676 # if we don't have any revisions touched by these changesets, bail
770 # if we don't have any revisions touched by these changesets, bail
677 if len(revs) == 0:
771 if len(revs) == 0:
678 yield closechunk()
772 yield closechunk()
679 return
773 return
680
774
681 cl = self._repo.changelog
775 cl = self._repo.changelog
682
776
683 # add the parent of the first rev
777 # add the parent of the first rev
684 p = store.parentrevs(revs[0])[0]
778 p = store.parentrevs(revs[0])[0]
685 revs.insert(0, p)
779 revs.insert(0, p)
686
780
687 # build deltas
781 # build deltas
688 progress = None
782 progress = None
689 if units is not None:
783 if units is not None:
690 progress = self._repo.ui.makeprogress(_('bundling'), unit=units,
784 progress = self._repo.ui.makeprogress(_('bundling'), unit=units,
691 total=(len(revs) - 1))
785 total=(len(revs) - 1))
692 for r in pycompat.xrange(len(revs) - 1):
786 for r in pycompat.xrange(len(revs) - 1):
693 if progress:
787 if progress:
694 progress.update(r + 1)
788 progress.update(r + 1)
695 prev, curr = revs[r], revs[r + 1]
789 prev, curr = revs[r], revs[r + 1]
696 linknode = lookup(store.node(curr))
790 linknode = lookup(store.node(curr))
697
791
698 if self._ellipses:
792 if self._ellipses:
699 linkrev = cl.rev(linknode)
793 linkrev = cl.rev(linknode)
700 clrevtolocalrev[linkrev] = curr
794 clrevtolocalrev[linkrev] = curr
701
795
702 # This is a node to send in full, because the changeset it
796 # This is a node to send in full, because the changeset it
703 # corresponds to was a full changeset.
797 # corresponds to was a full changeset.
704 if linknode in self._fullclnodes:
798 if linknode in self._fullclnodes:
705 delta = _revisiondeltanormal(store, curr, prev, linknode,
799 delta = _revisiondeltanormal(store, curr, prev, linknode,
706 self._deltaparentfn)
800 self._deltaparentfn)
707 elif linkrev not in self._precomputedellipsis:
801 elif linkrev not in self._precomputedellipsis:
708 delta = None
802 delta = None
709 else:
803 else:
710 delta = self._revisiondeltanarrow(
804 delta = _revisiondeltanarrow(
711 cl, store, ischangelog, curr, linkrev, linknode,
805 cl, store, ischangelog, curr, linkrev, linknode,
712 clrevtolocalrev, self._fullclnodes,
806 clrevtolocalrev, self._fullclnodes,
713 self._precomputedellipsis)
807 self._precomputedellipsis)
714 else:
808 else:
715 delta = _revisiondeltanormal(store, curr, prev, linknode,
809 delta = _revisiondeltanormal(store, curr, prev, linknode,
716 self._deltaparentfn)
810 self._deltaparentfn)
717
811
718 if not delta:
812 if not delta:
719 continue
813 continue
720
814
721 meta = self._builddeltaheader(delta)
815 meta = self._builddeltaheader(delta)
722 l = len(meta) + sum(len(x) for x in delta.deltachunks)
816 l = len(meta) + sum(len(x) for x in delta.deltachunks)
723 yield chunkheader(l)
817 yield chunkheader(l)
724 yield meta
818 yield meta
725 for x in delta.deltachunks:
819 for x in delta.deltachunks:
726 yield x
820 yield x
727
821
728 if progress:
822 if progress:
729 progress.complete()
823 progress.complete()
730
824
731 yield closechunk()
825 yield closechunk()
732
826
733 # filter any nodes that claim to be part of the known set
827 # filter any nodes that claim to be part of the known set
734 def _prune(self, store, missing, commonrevs):
828 def _prune(self, store, missing, commonrevs):
735 # TODO this violates storage abstraction for manifests.
829 # TODO this violates storage abstraction for manifests.
736 if isinstance(store, manifest.manifestrevlog):
830 if isinstance(store, manifest.manifestrevlog):
737 if not self._filematcher.visitdir(store._dir[:-1] or '.'):
831 if not self._filematcher.visitdir(store._dir[:-1] or '.'):
738 return []
832 return []
739
833
740 rr, rl = store.rev, store.linkrev
834 rr, rl = store.rev, store.linkrev
741 return [n for n in missing if rl(rr(n)) not in commonrevs]
835 return [n for n in missing if rl(rr(n)) not in commonrevs]
742
836
743 def _packmanifests(self, dir, dirlog, revs, lookuplinknode,
837 def _packmanifests(self, dir, dirlog, revs, lookuplinknode,
744 clrevtolocalrev):
838 clrevtolocalrev):
745 """Pack manifests into a changegroup stream.
839 """Pack manifests into a changegroup stream.
746
840
747 Encodes the directory name in the output so multiple manifests
841 Encodes the directory name in the output so multiple manifests
748 can be sent. Multiple manifests is not supported by cg1 and cg2.
842 can be sent. Multiple manifests is not supported by cg1 and cg2.
749 """
843 """
750 if dir:
844 if dir:
751 assert self.version == b'03'
845 assert self.version == b'03'
752 yield _fileheader(dir)
846 yield _fileheader(dir)
753
847
754 for chunk in self.group(revs, dirlog, False, lookuplinknode,
848 for chunk in self.group(revs, dirlog, False, lookuplinknode,
755 units=_('manifests'),
849 units=_('manifests'),
756 clrevtolocalrev=clrevtolocalrev):
850 clrevtolocalrev=clrevtolocalrev):
757 yield chunk
851 yield chunk
758
852
759 def generate(self, commonrevs, clnodes, fastpathlinkrev, source):
853 def generate(self, commonrevs, clnodes, fastpathlinkrev, source):
760 """Yield a sequence of changegroup byte chunks."""
854 """Yield a sequence of changegroup byte chunks."""
761
855
762 repo = self._repo
856 repo = self._repo
763 cl = repo.changelog
857 cl = repo.changelog
764
858
765 self._verbosenote(_('uncompressed size of bundle content:\n'))
859 self._verbosenote(_('uncompressed size of bundle content:\n'))
766 size = 0
860 size = 0
767
861
768 clstate, chunks = self._generatechangelog(cl, clnodes)
862 clstate, chunks = self._generatechangelog(cl, clnodes)
769 for chunk in chunks:
863 for chunk in chunks:
770 size += len(chunk)
864 size += len(chunk)
771 yield chunk
865 yield chunk
772
866
773 self._verbosenote(_('%8.i (changelog)\n') % size)
867 self._verbosenote(_('%8.i (changelog)\n') % size)
774
868
775 clrevorder = clstate['clrevorder']
869 clrevorder = clstate['clrevorder']
776 mfs = clstate['mfs']
870 mfs = clstate['mfs']
777 changedfiles = clstate['changedfiles']
871 changedfiles = clstate['changedfiles']
778
872
779 # We need to make sure that the linkrev in the changegroup refers to
873 # We need to make sure that the linkrev in the changegroup refers to
780 # the first changeset that introduced the manifest or file revision.
874 # the first changeset that introduced the manifest or file revision.
781 # The fastpath is usually safer than the slowpath, because the filelogs
875 # The fastpath is usually safer than the slowpath, because the filelogs
782 # are walked in revlog order.
876 # are walked in revlog order.
783 #
877 #
784 # When taking the slowpath with reorder=None and the manifest revlog
878 # When taking the slowpath with reorder=None and the manifest revlog
785 # uses generaldelta, the manifest may be walked in the "wrong" order.
879 # uses generaldelta, the manifest may be walked in the "wrong" order.
786 # Without 'clrevorder', we would get an incorrect linkrev (see fix in
880 # Without 'clrevorder', we would get an incorrect linkrev (see fix in
787 # cc0ff93d0c0c).
881 # cc0ff93d0c0c).
788 #
882 #
789 # When taking the fastpath, we are only vulnerable to reordering
883 # When taking the fastpath, we are only vulnerable to reordering
790 # of the changelog itself. The changelog never uses generaldelta, so
884 # of the changelog itself. The changelog never uses generaldelta, so
791 # it is only reordered when reorder=True. To handle this case, we
885 # it is only reordered when reorder=True. To handle this case, we
792 # simply take the slowpath, which already has the 'clrevorder' logic.
886 # simply take the slowpath, which already has the 'clrevorder' logic.
793 # This was also fixed in cc0ff93d0c0c.
887 # This was also fixed in cc0ff93d0c0c.
794 fastpathlinkrev = fastpathlinkrev and not self._reorder
888 fastpathlinkrev = fastpathlinkrev and not self._reorder
795 # Treemanifests don't work correctly with fastpathlinkrev
889 # Treemanifests don't work correctly with fastpathlinkrev
796 # either, because we don't discover which directory nodes to
890 # either, because we don't discover which directory nodes to
797 # send along with files. This could probably be fixed.
891 # send along with files. This could probably be fixed.
798 fastpathlinkrev = fastpathlinkrev and (
892 fastpathlinkrev = fastpathlinkrev and (
799 'treemanifest' not in repo.requirements)
893 'treemanifest' not in repo.requirements)
800
894
801 fnodes = {} # needed file nodes
895 fnodes = {} # needed file nodes
802
896
803 for chunk in self.generatemanifests(commonrevs, clrevorder,
897 for chunk in self.generatemanifests(commonrevs, clrevorder,
804 fastpathlinkrev, mfs, fnodes, source,
898 fastpathlinkrev, mfs, fnodes, source,
805 clstate['clrevtomanifestrev']):
899 clstate['clrevtomanifestrev']):
806 yield chunk
900 yield chunk
807
901
808 mfdicts = None
902 mfdicts = None
809 if self._ellipses and self._isshallow:
903 if self._ellipses and self._isshallow:
810 mfdicts = [(self._repo.manifestlog[n].read(), lr)
904 mfdicts = [(self._repo.manifestlog[n].read(), lr)
811 for (n, lr) in mfs.iteritems()]
905 for (n, lr) in mfs.iteritems()]
812
906
813 mfs.clear()
907 mfs.clear()
814 clrevs = set(cl.rev(x) for x in clnodes)
908 clrevs = set(cl.rev(x) for x in clnodes)
815
909
816 for chunk in self.generatefiles(changedfiles, commonrevs,
910 for chunk in self.generatefiles(changedfiles, commonrevs,
817 source, mfdicts, fastpathlinkrev,
911 source, mfdicts, fastpathlinkrev,
818 fnodes, clrevs):
912 fnodes, clrevs):
819 yield chunk
913 yield chunk
820
914
821 yield closechunk()
915 yield closechunk()
822
916
823 if clnodes:
917 if clnodes:
824 repo.hook('outgoing', node=hex(clnodes[0]), source=source)
918 repo.hook('outgoing', node=hex(clnodes[0]), source=source)
825
919
826 def _generatechangelog(self, cl, nodes):
920 def _generatechangelog(self, cl, nodes):
827 """Generate data for changelog chunks.
921 """Generate data for changelog chunks.
828
922
829 Returns a 2-tuple of a dict containing state and an iterable of
923 Returns a 2-tuple of a dict containing state and an iterable of
830 byte chunks. The state will not be fully populated until the
924 byte chunks. The state will not be fully populated until the
831 chunk stream has been fully consumed.
925 chunk stream has been fully consumed.
832 """
926 """
833 clrevorder = {}
927 clrevorder = {}
834 mfs = {} # needed manifests
928 mfs = {} # needed manifests
835 mfl = self._repo.manifestlog
929 mfl = self._repo.manifestlog
836 # TODO violates storage abstraction.
930 # TODO violates storage abstraction.
837 mfrevlog = mfl._revlog
931 mfrevlog = mfl._revlog
838 changedfiles = set()
932 changedfiles = set()
839 clrevtomanifestrev = {}
933 clrevtomanifestrev = {}
840
934
841 # Callback for the changelog, used to collect changed files and
935 # Callback for the changelog, used to collect changed files and
842 # manifest nodes.
936 # manifest nodes.
843 # Returns the linkrev node (identity in the changelog case).
937 # Returns the linkrev node (identity in the changelog case).
844 def lookupcl(x):
938 def lookupcl(x):
845 c = cl.read(x)
939 c = cl.read(x)
846 clrevorder[x] = len(clrevorder)
940 clrevorder[x] = len(clrevorder)
847
941
848 if self._ellipses:
942 if self._ellipses:
849 # Only update mfs if x is going to be sent. Otherwise we
943 # Only update mfs if x is going to be sent. Otherwise we
850 # end up with bogus linkrevs specified for manifests and
944 # end up with bogus linkrevs specified for manifests and
851 # we skip some manifest nodes that we should otherwise
945 # we skip some manifest nodes that we should otherwise
852 # have sent.
946 # have sent.
853 if (x in self._fullclnodes
947 if (x in self._fullclnodes
854 or cl.rev(x) in self._precomputedellipsis):
948 or cl.rev(x) in self._precomputedellipsis):
855 n = c[0]
949 n = c[0]
856 # Record the first changeset introducing this manifest
950 # Record the first changeset introducing this manifest
857 # version.
951 # version.
858 mfs.setdefault(n, x)
952 mfs.setdefault(n, x)
859 # Set this narrow-specific dict so we have the lowest
953 # Set this narrow-specific dict so we have the lowest
860 # manifest revnum to look up for this cl revnum. (Part of
954 # manifest revnum to look up for this cl revnum. (Part of
861 # mapping changelog ellipsis parents to manifest ellipsis
955 # mapping changelog ellipsis parents to manifest ellipsis
862 # parents)
956 # parents)
863 clrevtomanifestrev.setdefault(cl.rev(x), mfrevlog.rev(n))
957 clrevtomanifestrev.setdefault(cl.rev(x), mfrevlog.rev(n))
864 # We can't trust the changed files list in the changeset if the
958 # We can't trust the changed files list in the changeset if the
865 # client requested a shallow clone.
959 # client requested a shallow clone.
866 if self._isshallow:
960 if self._isshallow:
867 changedfiles.update(mfl[c[0]].read().keys())
961 changedfiles.update(mfl[c[0]].read().keys())
868 else:
962 else:
869 changedfiles.update(c[3])
963 changedfiles.update(c[3])
870 else:
964 else:
871
965
872 n = c[0]
966 n = c[0]
873 # record the first changeset introducing this manifest version
967 # record the first changeset introducing this manifest version
874 mfs.setdefault(n, x)
968 mfs.setdefault(n, x)
875 # Record a complete list of potentially-changed files in
969 # Record a complete list of potentially-changed files in
876 # this manifest.
970 # this manifest.
877 changedfiles.update(c[3])
971 changedfiles.update(c[3])
878
972
879 return x
973 return x
880
974
881 # Changelog doesn't benefit from reordering revisions. So send out
975 # Changelog doesn't benefit from reordering revisions. So send out
882 # revisions in store order.
976 # revisions in store order.
883 revs = sorted(cl.rev(n) for n in nodes)
977 revs = sorted(cl.rev(n) for n in nodes)
884
978
885 state = {
979 state = {
886 'clrevorder': clrevorder,
980 'clrevorder': clrevorder,
887 'mfs': mfs,
981 'mfs': mfs,
888 'changedfiles': changedfiles,
982 'changedfiles': changedfiles,
889 'clrevtomanifestrev': clrevtomanifestrev,
983 'clrevtomanifestrev': clrevtomanifestrev,
890 }
984 }
891
985
892 gen = self.group(revs, cl, True, lookupcl, units=_('changesets'),
986 gen = self.group(revs, cl, True, lookupcl, units=_('changesets'),
893 clrevtolocalrev={})
987 clrevtolocalrev={})
894
988
895 return state, gen
989 return state, gen
896
990
897 def generatemanifests(self, commonrevs, clrevorder, fastpathlinkrev, mfs,
991 def generatemanifests(self, commonrevs, clrevorder, fastpathlinkrev, mfs,
898 fnodes, source, clrevtolocalrev):
992 fnodes, source, clrevtolocalrev):
899 """Returns an iterator of changegroup chunks containing manifests.
993 """Returns an iterator of changegroup chunks containing manifests.
900
994
901 `source` is unused here, but is used by extensions like remotefilelog to
995 `source` is unused here, but is used by extensions like remotefilelog to
902 change what is sent based in pulls vs pushes, etc.
996 change what is sent based in pulls vs pushes, etc.
903 """
997 """
904 repo = self._repo
998 repo = self._repo
905 cl = repo.changelog
999 cl = repo.changelog
906 mfl = repo.manifestlog
1000 mfl = repo.manifestlog
907 dirlog = mfl._revlog.dirlog
1001 dirlog = mfl._revlog.dirlog
908 tmfnodes = {'': mfs}
1002 tmfnodes = {'': mfs}
909
1003
910 # Callback for the manifest, used to collect linkrevs for filelog
1004 # Callback for the manifest, used to collect linkrevs for filelog
911 # revisions.
1005 # revisions.
912 # Returns the linkrev node (collected in lookupcl).
1006 # Returns the linkrev node (collected in lookupcl).
913 def makelookupmflinknode(dir, nodes):
1007 def makelookupmflinknode(dir, nodes):
914 if fastpathlinkrev:
1008 if fastpathlinkrev:
915 assert not dir
1009 assert not dir
916 return mfs.__getitem__
1010 return mfs.__getitem__
917
1011
918 def lookupmflinknode(x):
1012 def lookupmflinknode(x):
919 """Callback for looking up the linknode for manifests.
1013 """Callback for looking up the linknode for manifests.
920
1014
921 Returns the linkrev node for the specified manifest.
1015 Returns the linkrev node for the specified manifest.
922
1016
923 SIDE EFFECT:
1017 SIDE EFFECT:
924
1018
925 1) fclnodes gets populated with the list of relevant
1019 1) fclnodes gets populated with the list of relevant
926 file nodes if we're not using fastpathlinkrev
1020 file nodes if we're not using fastpathlinkrev
927 2) When treemanifests are in use, collects treemanifest nodes
1021 2) When treemanifests are in use, collects treemanifest nodes
928 to send
1022 to send
929
1023
930 Note that this means manifests must be completely sent to
1024 Note that this means manifests must be completely sent to
931 the client before you can trust the list of files and
1025 the client before you can trust the list of files and
932 treemanifests to send.
1026 treemanifests to send.
933 """
1027 """
934 clnode = nodes[x]
1028 clnode = nodes[x]
935 mdata = mfl.get(dir, x).readfast(shallow=True)
1029 mdata = mfl.get(dir, x).readfast(shallow=True)
936 for p, n, fl in mdata.iterentries():
1030 for p, n, fl in mdata.iterentries():
937 if fl == 't': # subdirectory manifest
1031 if fl == 't': # subdirectory manifest
938 subdir = dir + p + '/'
1032 subdir = dir + p + '/'
939 tmfclnodes = tmfnodes.setdefault(subdir, {})
1033 tmfclnodes = tmfnodes.setdefault(subdir, {})
940 tmfclnode = tmfclnodes.setdefault(n, clnode)
1034 tmfclnode = tmfclnodes.setdefault(n, clnode)
941 if clrevorder[clnode] < clrevorder[tmfclnode]:
1035 if clrevorder[clnode] < clrevorder[tmfclnode]:
942 tmfclnodes[n] = clnode
1036 tmfclnodes[n] = clnode
943 else:
1037 else:
944 f = dir + p
1038 f = dir + p
945 fclnodes = fnodes.setdefault(f, {})
1039 fclnodes = fnodes.setdefault(f, {})
946 fclnode = fclnodes.setdefault(n, clnode)
1040 fclnode = fclnodes.setdefault(n, clnode)
947 if clrevorder[clnode] < clrevorder[fclnode]:
1041 if clrevorder[clnode] < clrevorder[fclnode]:
948 fclnodes[n] = clnode
1042 fclnodes[n] = clnode
949 return clnode
1043 return clnode
950 return lookupmflinknode
1044 return lookupmflinknode
951
1045
952 size = 0
1046 size = 0
953 while tmfnodes:
1047 while tmfnodes:
954 dir, nodes = tmfnodes.popitem()
1048 dir, nodes = tmfnodes.popitem()
955 store = dirlog(dir)
1049 store = dirlog(dir)
956 prunednodes = self._prune(store, nodes, commonrevs)
1050 prunednodes = self._prune(store, nodes, commonrevs)
957 if not dir or prunednodes:
1051 if not dir or prunednodes:
958 lookupfn = makelookupmflinknode(dir, nodes)
1052 lookupfn = makelookupmflinknode(dir, nodes)
959
1053
960 if self._ellipses:
1054 if self._ellipses:
961 revs = _sortnodesellipsis(store, prunednodes, cl,
1055 revs = _sortnodesellipsis(store, prunednodes, cl,
962 lookupfn)
1056 lookupfn)
963 else:
1057 else:
964 revs = _sortnodesnormal(store, prunednodes,
1058 revs = _sortnodesnormal(store, prunednodes,
965 self._reorder)
1059 self._reorder)
966
1060
967 for x in self._packmanifests(dir, store, revs, lookupfn,
1061 for x in self._packmanifests(dir, store, revs, lookupfn,
968 clrevtolocalrev):
1062 clrevtolocalrev):
969 size += len(x)
1063 size += len(x)
970 yield x
1064 yield x
971 self._verbosenote(_('%8.i (manifests)\n') % size)
1065 self._verbosenote(_('%8.i (manifests)\n') % size)
972 yield self._manifestsend
1066 yield self._manifestsend
973
1067
974 # The 'source' parameter is useful for extensions
1068 # The 'source' parameter is useful for extensions
975 def generatefiles(self, changedfiles, commonrevs, source,
1069 def generatefiles(self, changedfiles, commonrevs, source,
976 mfdicts, fastpathlinkrev, fnodes, clrevs):
1070 mfdicts, fastpathlinkrev, fnodes, clrevs):
977 changedfiles = list(filter(self._filematcher, changedfiles))
1071 changedfiles = list(filter(self._filematcher, changedfiles))
978
1072
979 if not fastpathlinkrev:
1073 if not fastpathlinkrev:
980 def normallinknodes(unused, fname):
1074 def normallinknodes(unused, fname):
981 return fnodes.get(fname, {})
1075 return fnodes.get(fname, {})
982 else:
1076 else:
983 cln = self._repo.changelog.node
1077 cln = self._repo.changelog.node
984
1078
985 def normallinknodes(store, fname):
1079 def normallinknodes(store, fname):
986 flinkrev = store.linkrev
1080 flinkrev = store.linkrev
987 fnode = store.node
1081 fnode = store.node
988 revs = ((r, flinkrev(r)) for r in store)
1082 revs = ((r, flinkrev(r)) for r in store)
989 return dict((fnode(r), cln(lr))
1083 return dict((fnode(r), cln(lr))
990 for r, lr in revs if lr in clrevs)
1084 for r, lr in revs if lr in clrevs)
991
1085
992 clrevtolocalrev = {}
1086 clrevtolocalrev = {}
993
1087
994 if self._isshallow:
1088 if self._isshallow:
995 # In a shallow clone, the linknodes callback needs to also include
1089 # In a shallow clone, the linknodes callback needs to also include
996 # those file nodes that are in the manifests we sent but weren't
1090 # those file nodes that are in the manifests we sent but weren't
997 # introduced by those manifests.
1091 # introduced by those manifests.
998 commonctxs = [self._repo[c] for c in commonrevs]
1092 commonctxs = [self._repo[c] for c in commonrevs]
999 clrev = self._repo.changelog.rev
1093 clrev = self._repo.changelog.rev
1000
1094
1001 # Defining this function has a side-effect of overriding the
1095 # Defining this function has a side-effect of overriding the
1002 # function of the same name that was passed in as an argument.
1096 # function of the same name that was passed in as an argument.
1003 # TODO have caller pass in appropriate function.
1097 # TODO have caller pass in appropriate function.
1004 def linknodes(flog, fname):
1098 def linknodes(flog, fname):
1005 for c in commonctxs:
1099 for c in commonctxs:
1006 try:
1100 try:
1007 fnode = c.filenode(fname)
1101 fnode = c.filenode(fname)
1008 clrevtolocalrev[c.rev()] = flog.rev(fnode)
1102 clrevtolocalrev[c.rev()] = flog.rev(fnode)
1009 except error.ManifestLookupError:
1103 except error.ManifestLookupError:
1010 pass
1104 pass
1011 links = normallinknodes(flog, fname)
1105 links = normallinknodes(flog, fname)
1012 if len(links) != len(mfdicts):
1106 if len(links) != len(mfdicts):
1013 for mf, lr in mfdicts:
1107 for mf, lr in mfdicts:
1014 fnode = mf.get(fname, None)
1108 fnode = mf.get(fname, None)
1015 if fnode in links:
1109 if fnode in links:
1016 links[fnode] = min(links[fnode], lr, key=clrev)
1110 links[fnode] = min(links[fnode], lr, key=clrev)
1017 elif fnode:
1111 elif fnode:
1018 links[fnode] = lr
1112 links[fnode] = lr
1019 return links
1113 return links
1020 else:
1114 else:
1021 linknodes = normallinknodes
1115 linknodes = normallinknodes
1022
1116
1023 repo = self._repo
1117 repo = self._repo
1024 cl = repo.changelog
1118 cl = repo.changelog
1025 progress = repo.ui.makeprogress(_('bundling'), unit=_('files'),
1119 progress = repo.ui.makeprogress(_('bundling'), unit=_('files'),
1026 total=len(changedfiles))
1120 total=len(changedfiles))
1027 for i, fname in enumerate(sorted(changedfiles)):
1121 for i, fname in enumerate(sorted(changedfiles)):
1028 filerevlog = repo.file(fname)
1122 filerevlog = repo.file(fname)
1029 if not filerevlog:
1123 if not filerevlog:
1030 raise error.Abort(_("empty or missing file data for %s") %
1124 raise error.Abort(_("empty or missing file data for %s") %
1031 fname)
1125 fname)
1032
1126
1033 clrevtolocalrev.clear()
1127 clrevtolocalrev.clear()
1034
1128
1035 linkrevnodes = linknodes(filerevlog, fname)
1129 linkrevnodes = linknodes(filerevlog, fname)
1036 # Lookup for filenodes, we collected the linkrev nodes above in the
1130 # Lookup for filenodes, we collected the linkrev nodes above in the
1037 # fastpath case and with lookupmf in the slowpath case.
1131 # fastpath case and with lookupmf in the slowpath case.
1038 def lookupfilelog(x):
1132 def lookupfilelog(x):
1039 return linkrevnodes[x]
1133 return linkrevnodes[x]
1040
1134
1041 filenodes = self._prune(filerevlog, linkrevnodes, commonrevs)
1135 filenodes = self._prune(filerevlog, linkrevnodes, commonrevs)
1042 if filenodes:
1136 if filenodes:
1043 if self._ellipses:
1137 if self._ellipses:
1044 revs = _sortnodesellipsis(filerevlog, filenodes,
1138 revs = _sortnodesellipsis(filerevlog, filenodes,
1045 cl, lookupfilelog)
1139 cl, lookupfilelog)
1046 else:
1140 else:
1047 revs = _sortnodesnormal(filerevlog, filenodes,
1141 revs = _sortnodesnormal(filerevlog, filenodes,
1048 self._reorder)
1142 self._reorder)
1049
1143
1050 progress.update(i + 1, item=fname)
1144 progress.update(i + 1, item=fname)
1051 h = _fileheader(fname)
1145 h = _fileheader(fname)
1052 size = len(h)
1146 size = len(h)
1053 yield h
1147 yield h
1054 for chunk in self.group(revs, filerevlog, False, lookupfilelog,
1148 for chunk in self.group(revs, filerevlog, False, lookupfilelog,
1055 clrevtolocalrev=clrevtolocalrev):
1149 clrevtolocalrev=clrevtolocalrev):
1056 size += len(chunk)
1150 size += len(chunk)
1057 yield chunk
1151 yield chunk
1058 self._verbosenote(_('%8.i %s\n') % (size, fname))
1152 self._verbosenote(_('%8.i %s\n') % (size, fname))
1059 progress.complete()
1153 progress.complete()
1060
1154
1061 def _revisiondeltanarrow(self, cl, store, ischangelog, rev, linkrev,
1062 linknode, clrevtolocalrev, fullclnodes,
1063 precomputedellipsis):
1064 linkparents = precomputedellipsis[linkrev]
1065 def local(clrev):
1066 """Turn a changelog revnum into a local revnum.
1067
1068 The ellipsis dag is stored as revnums on the changelog,
1069 but when we're producing ellipsis entries for
1070 non-changelog revlogs, we need to turn those numbers into
1071 something local. This does that for us, and during the
1072 changelog sending phase will also expand the stored
1073 mappings as needed.
1074 """
1075 if clrev == nullrev:
1076 return nullrev
1077
1078 if ischangelog:
1079 return clrev
1080
1081 # Walk the ellipsis-ized changelog breadth-first looking for a
1082 # change that has been linked from the current revlog.
1083 #
1084 # For a flat manifest revlog only a single step should be necessary
1085 # as all relevant changelog entries are relevant to the flat
1086 # manifest.
1087 #
1088 # For a filelog or tree manifest dirlog however not every changelog
1089 # entry will have been relevant, so we need to skip some changelog
1090 # nodes even after ellipsis-izing.
1091 walk = [clrev]
1092 while walk:
1093 p = walk[0]
1094 walk = walk[1:]
1095 if p in clrevtolocalrev:
1096 return clrevtolocalrev[p]
1097 elif p in fullclnodes:
1098 walk.extend([pp for pp in cl.parentrevs(p)
1099 if pp != nullrev])
1100 elif p in precomputedellipsis:
1101 walk.extend([pp for pp in precomputedellipsis[p]
1102 if pp != nullrev])
1103 else:
1104 # In this case, we've got an ellipsis with parents
1105 # outside the current bundle (likely an
1106 # incremental pull). We "know" that we can use the
1107 # value of this same revlog at whatever revision
1108 # is pointed to by linknode. "Know" is in scare
1109 # quotes because I haven't done enough examination
1110 # of edge cases to convince myself this is really
1111 # a fact - it works for all the (admittedly
1112 # thorough) cases in our testsuite, but I would be
1113 # somewhat unsurprised to find a case in the wild
1114 # where this breaks down a bit. That said, I don't
1115 # know if it would hurt anything.
1116 for i in pycompat.xrange(rev, 0, -1):
1117 if store.linkrev(i) == clrev:
1118 return i
1119 # We failed to resolve a parent for this node, so
1120 # we crash the changegroup construction.
1121 raise error.Abort(
1122 'unable to resolve parent while packing %r %r'
1123 ' for changeset %r' % (store.indexfile, rev, clrev))
1124
1125 return nullrev
1126
1127 if not linkparents or (
1128 store.parentrevs(rev) == (nullrev, nullrev)):
1129 p1, p2 = nullrev, nullrev
1130 elif len(linkparents) == 1:
1131 p1, = sorted(local(p) for p in linkparents)
1132 p2 = nullrev
1133 else:
1134 p1, p2 = sorted(local(p) for p in linkparents)
1135
1136 n = store.node(rev)
1137 p1n, p2n = store.node(p1), store.node(p2)
1138 flags = store.flags(rev)
1139 flags |= revlog.REVIDX_ELLIPSIS
1140
1141 # TODO: try and actually send deltas for ellipsis data blocks
1142 data = store.revision(n)
1143 diffheader = mdiff.trivialdiffheader(len(data))
1144
1145 return revisiondelta(
1146 node=n,
1147 p1node=p1n,
1148 p2node=p2n,
1149 basenode=nullid,
1150 linknode=linknode,
1151 flags=flags,
1152 deltachunks=(diffheader, data),
1153 )
1154
1155 def _deltaparentprev(store, rev, p1, p2, prev):
1155 def _deltaparentprev(store, rev, p1, p2, prev):
1156 """Resolve a delta parent to the previous revision.
1156 """Resolve a delta parent to the previous revision.
1157
1157
1158 Used for version 1 changegroups, which don't support generaldelta.
1158 Used for version 1 changegroups, which don't support generaldelta.
1159 """
1159 """
1160 return prev
1160 return prev
1161
1161
1162 def _deltaparentgeneraldelta(store, rev, p1, p2, prev):
1162 def _deltaparentgeneraldelta(store, rev, p1, p2, prev):
1163 """Resolve a delta parent when general deltas are supported."""
1163 """Resolve a delta parent when general deltas are supported."""
1164 dp = store.deltaparent(rev)
1164 dp = store.deltaparent(rev)
1165 if dp == nullrev and store.storedeltachains:
1165 if dp == nullrev and store.storedeltachains:
1166 # Avoid sending full revisions when delta parent is null. Pick prev
1166 # Avoid sending full revisions when delta parent is null. Pick prev
1167 # in that case. It's tempting to pick p1 in this case, as p1 will
1167 # in that case. It's tempting to pick p1 in this case, as p1 will
1168 # be smaller in the common case. However, computing a delta against
1168 # be smaller in the common case. However, computing a delta against
1169 # p1 may require resolving the raw text of p1, which could be
1169 # p1 may require resolving the raw text of p1, which could be
1170 # expensive. The revlog caches should have prev cached, meaning
1170 # expensive. The revlog caches should have prev cached, meaning
1171 # less CPU for changegroup generation. There is likely room to add
1171 # less CPU for changegroup generation. There is likely room to add
1172 # a flag and/or config option to control this behavior.
1172 # a flag and/or config option to control this behavior.
1173 base = prev
1173 base = prev
1174 elif dp == nullrev:
1174 elif dp == nullrev:
1175 # revlog is configured to use full snapshot for a reason,
1175 # revlog is configured to use full snapshot for a reason,
1176 # stick to full snapshot.
1176 # stick to full snapshot.
1177 base = nullrev
1177 base = nullrev
1178 elif dp not in (p1, p2, prev):
1178 elif dp not in (p1, p2, prev):
1179 # Pick prev when we can't be sure remote has the base revision.
1179 # Pick prev when we can't be sure remote has the base revision.
1180 return prev
1180 return prev
1181 else:
1181 else:
1182 base = dp
1182 base = dp
1183
1183
1184 if base != nullrev and not store.candelta(base, rev):
1184 if base != nullrev and not store.candelta(base, rev):
1185 base = nullrev
1185 base = nullrev
1186
1186
1187 return base
1187 return base
1188
1188
1189 def _deltaparentellipses(store, rev, p1, p2, prev):
1189 def _deltaparentellipses(store, rev, p1, p2, prev):
1190 """Resolve a delta parent when in ellipses mode."""
1190 """Resolve a delta parent when in ellipses mode."""
1191 # TODO: send better deltas when in narrow mode.
1191 # TODO: send better deltas when in narrow mode.
1192 #
1192 #
1193 # changegroup.group() loops over revisions to send,
1193 # changegroup.group() loops over revisions to send,
1194 # including revisions we'll skip. What this means is that
1194 # including revisions we'll skip. What this means is that
1195 # `prev` will be a potentially useless delta base for all
1195 # `prev` will be a potentially useless delta base for all
1196 # ellipsis nodes, as the client likely won't have it. In
1196 # ellipsis nodes, as the client likely won't have it. In
1197 # the future we should do bookkeeping about which nodes
1197 # the future we should do bookkeeping about which nodes
1198 # have been sent to the client, and try to be
1198 # have been sent to the client, and try to be
1199 # significantly smarter about delta bases. This is
1199 # significantly smarter about delta bases. This is
1200 # slightly tricky because this same code has to work for
1200 # slightly tricky because this same code has to work for
1201 # all revlogs, and we don't have the linkrev/linknode here.
1201 # all revlogs, and we don't have the linkrev/linknode here.
1202 return p1
1202 return p1
1203
1203
1204 def _makecg1packer(repo, filematcher, bundlecaps, ellipses=False,
1204 def _makecg1packer(repo, filematcher, bundlecaps, ellipses=False,
1205 shallow=False, ellipsisroots=None, fullnodes=None):
1205 shallow=False, ellipsisroots=None, fullnodes=None):
1206 builddeltaheader = lambda d: _CHANGEGROUPV1_DELTA_HEADER.pack(
1206 builddeltaheader = lambda d: _CHANGEGROUPV1_DELTA_HEADER.pack(
1207 d.node, d.p1node, d.p2node, d.linknode)
1207 d.node, d.p1node, d.p2node, d.linknode)
1208
1208
1209 return cgpacker(repo, filematcher, b'01',
1209 return cgpacker(repo, filematcher, b'01',
1210 deltaparentfn=_deltaparentprev,
1210 deltaparentfn=_deltaparentprev,
1211 allowreorder=None,
1211 allowreorder=None,
1212 builddeltaheader=builddeltaheader,
1212 builddeltaheader=builddeltaheader,
1213 manifestsend=b'',
1213 manifestsend=b'',
1214 bundlecaps=bundlecaps,
1214 bundlecaps=bundlecaps,
1215 ellipses=ellipses,
1215 ellipses=ellipses,
1216 shallow=shallow,
1216 shallow=shallow,
1217 ellipsisroots=ellipsisroots,
1217 ellipsisroots=ellipsisroots,
1218 fullnodes=fullnodes)
1218 fullnodes=fullnodes)
1219
1219
1220 def _makecg2packer(repo, filematcher, bundlecaps, ellipses=False,
1220 def _makecg2packer(repo, filematcher, bundlecaps, ellipses=False,
1221 shallow=False, ellipsisroots=None, fullnodes=None):
1221 shallow=False, ellipsisroots=None, fullnodes=None):
1222 builddeltaheader = lambda d: _CHANGEGROUPV2_DELTA_HEADER.pack(
1222 builddeltaheader = lambda d: _CHANGEGROUPV2_DELTA_HEADER.pack(
1223 d.node, d.p1node, d.p2node, d.basenode, d.linknode)
1223 d.node, d.p1node, d.p2node, d.basenode, d.linknode)
1224
1224
1225 # Since generaldelta is directly supported by cg2, reordering
1225 # Since generaldelta is directly supported by cg2, reordering
1226 # generally doesn't help, so we disable it by default (treating
1226 # generally doesn't help, so we disable it by default (treating
1227 # bundle.reorder=auto just like bundle.reorder=False).
1227 # bundle.reorder=auto just like bundle.reorder=False).
1228 return cgpacker(repo, filematcher, b'02',
1228 return cgpacker(repo, filematcher, b'02',
1229 deltaparentfn=_deltaparentgeneraldelta,
1229 deltaparentfn=_deltaparentgeneraldelta,
1230 allowreorder=False,
1230 allowreorder=False,
1231 builddeltaheader=builddeltaheader,
1231 builddeltaheader=builddeltaheader,
1232 manifestsend=b'',
1232 manifestsend=b'',
1233 bundlecaps=bundlecaps,
1233 bundlecaps=bundlecaps,
1234 ellipses=ellipses,
1234 ellipses=ellipses,
1235 shallow=shallow,
1235 shallow=shallow,
1236 ellipsisroots=ellipsisroots,
1236 ellipsisroots=ellipsisroots,
1237 fullnodes=fullnodes)
1237 fullnodes=fullnodes)
1238
1238
1239 def _makecg3packer(repo, filematcher, bundlecaps, ellipses=False,
1239 def _makecg3packer(repo, filematcher, bundlecaps, ellipses=False,
1240 shallow=False, ellipsisroots=None, fullnodes=None):
1240 shallow=False, ellipsisroots=None, fullnodes=None):
1241 builddeltaheader = lambda d: _CHANGEGROUPV3_DELTA_HEADER.pack(
1241 builddeltaheader = lambda d: _CHANGEGROUPV3_DELTA_HEADER.pack(
1242 d.node, d.p1node, d.p2node, d.basenode, d.linknode, d.flags)
1242 d.node, d.p1node, d.p2node, d.basenode, d.linknode, d.flags)
1243
1243
1244 deltaparentfn = (_deltaparentellipses if ellipses
1244 deltaparentfn = (_deltaparentellipses if ellipses
1245 else _deltaparentgeneraldelta)
1245 else _deltaparentgeneraldelta)
1246
1246
1247 return cgpacker(repo, filematcher, b'03',
1247 return cgpacker(repo, filematcher, b'03',
1248 deltaparentfn=deltaparentfn,
1248 deltaparentfn=deltaparentfn,
1249 allowreorder=False,
1249 allowreorder=False,
1250 builddeltaheader=builddeltaheader,
1250 builddeltaheader=builddeltaheader,
1251 manifestsend=closechunk(),
1251 manifestsend=closechunk(),
1252 bundlecaps=bundlecaps,
1252 bundlecaps=bundlecaps,
1253 ellipses=ellipses,
1253 ellipses=ellipses,
1254 shallow=shallow,
1254 shallow=shallow,
1255 ellipsisroots=ellipsisroots,
1255 ellipsisroots=ellipsisroots,
1256 fullnodes=fullnodes)
1256 fullnodes=fullnodes)
1257
1257
1258 _packermap = {'01': (_makecg1packer, cg1unpacker),
1258 _packermap = {'01': (_makecg1packer, cg1unpacker),
1259 # cg2 adds support for exchanging generaldelta
1259 # cg2 adds support for exchanging generaldelta
1260 '02': (_makecg2packer, cg2unpacker),
1260 '02': (_makecg2packer, cg2unpacker),
1261 # cg3 adds support for exchanging revlog flags and treemanifests
1261 # cg3 adds support for exchanging revlog flags and treemanifests
1262 '03': (_makecg3packer, cg3unpacker),
1262 '03': (_makecg3packer, cg3unpacker),
1263 }
1263 }
1264
1264
1265 def allsupportedversions(repo):
1265 def allsupportedversions(repo):
1266 versions = set(_packermap.keys())
1266 versions = set(_packermap.keys())
1267 if not (repo.ui.configbool('experimental', 'changegroup3') or
1267 if not (repo.ui.configbool('experimental', 'changegroup3') or
1268 repo.ui.configbool('experimental', 'treemanifest') or
1268 repo.ui.configbool('experimental', 'treemanifest') or
1269 'treemanifest' in repo.requirements):
1269 'treemanifest' in repo.requirements):
1270 versions.discard('03')
1270 versions.discard('03')
1271 return versions
1271 return versions
1272
1272
1273 # Changegroup versions that can be applied to the repo
1273 # Changegroup versions that can be applied to the repo
1274 def supportedincomingversions(repo):
1274 def supportedincomingversions(repo):
1275 return allsupportedversions(repo)
1275 return allsupportedversions(repo)
1276
1276
1277 # Changegroup versions that can be created from the repo
1277 # Changegroup versions that can be created from the repo
1278 def supportedoutgoingversions(repo):
1278 def supportedoutgoingversions(repo):
1279 versions = allsupportedversions(repo)
1279 versions = allsupportedversions(repo)
1280 if 'treemanifest' in repo.requirements:
1280 if 'treemanifest' in repo.requirements:
1281 # Versions 01 and 02 support only flat manifests and it's just too
1281 # Versions 01 and 02 support only flat manifests and it's just too
1282 # expensive to convert between the flat manifest and tree manifest on
1282 # expensive to convert between the flat manifest and tree manifest on
1283 # the fly. Since tree manifests are hashed differently, all of history
1283 # the fly. Since tree manifests are hashed differently, all of history
1284 # would have to be converted. Instead, we simply don't even pretend to
1284 # would have to be converted. Instead, we simply don't even pretend to
1285 # support versions 01 and 02.
1285 # support versions 01 and 02.
1286 versions.discard('01')
1286 versions.discard('01')
1287 versions.discard('02')
1287 versions.discard('02')
1288 if repository.NARROW_REQUIREMENT in repo.requirements:
1288 if repository.NARROW_REQUIREMENT in repo.requirements:
1289 # Versions 01 and 02 don't support revlog flags, and we need to
1289 # Versions 01 and 02 don't support revlog flags, and we need to
1290 # support that for stripping and unbundling to work.
1290 # support that for stripping and unbundling to work.
1291 versions.discard('01')
1291 versions.discard('01')
1292 versions.discard('02')
1292 versions.discard('02')
1293 if LFS_REQUIREMENT in repo.requirements:
1293 if LFS_REQUIREMENT in repo.requirements:
1294 # Versions 01 and 02 don't support revlog flags, and we need to
1294 # Versions 01 and 02 don't support revlog flags, and we need to
1295 # mark LFS entries with REVIDX_EXTSTORED.
1295 # mark LFS entries with REVIDX_EXTSTORED.
1296 versions.discard('01')
1296 versions.discard('01')
1297 versions.discard('02')
1297 versions.discard('02')
1298
1298
1299 return versions
1299 return versions
1300
1300
1301 def localversion(repo):
1301 def localversion(repo):
1302 # Finds the best version to use for bundles that are meant to be used
1302 # Finds the best version to use for bundles that are meant to be used
1303 # locally, such as those from strip and shelve, and temporary bundles.
1303 # locally, such as those from strip and shelve, and temporary bundles.
1304 return max(supportedoutgoingversions(repo))
1304 return max(supportedoutgoingversions(repo))
1305
1305
1306 def safeversion(repo):
1306 def safeversion(repo):
1307 # Finds the smallest version that it's safe to assume clients of the repo
1307 # Finds the smallest version that it's safe to assume clients of the repo
1308 # will support. For example, all hg versions that support generaldelta also
1308 # will support. For example, all hg versions that support generaldelta also
1309 # support changegroup 02.
1309 # support changegroup 02.
1310 versions = supportedoutgoingversions(repo)
1310 versions = supportedoutgoingversions(repo)
1311 if 'generaldelta' in repo.requirements:
1311 if 'generaldelta' in repo.requirements:
1312 versions.discard('01')
1312 versions.discard('01')
1313 assert versions
1313 assert versions
1314 return min(versions)
1314 return min(versions)
1315
1315
1316 def getbundler(version, repo, bundlecaps=None, filematcher=None,
1316 def getbundler(version, repo, bundlecaps=None, filematcher=None,
1317 ellipses=False, shallow=False, ellipsisroots=None,
1317 ellipses=False, shallow=False, ellipsisroots=None,
1318 fullnodes=None):
1318 fullnodes=None):
1319 assert version in supportedoutgoingversions(repo)
1319 assert version in supportedoutgoingversions(repo)
1320
1320
1321 if filematcher is None:
1321 if filematcher is None:
1322 filematcher = matchmod.alwaysmatcher(repo.root, '')
1322 filematcher = matchmod.alwaysmatcher(repo.root, '')
1323
1323
1324 if version == '01' and not filematcher.always():
1324 if version == '01' and not filematcher.always():
1325 raise error.ProgrammingError('version 01 changegroups do not support '
1325 raise error.ProgrammingError('version 01 changegroups do not support '
1326 'sparse file matchers')
1326 'sparse file matchers')
1327
1327
1328 if ellipses and version in (b'01', b'02'):
1328 if ellipses and version in (b'01', b'02'):
1329 raise error.Abort(
1329 raise error.Abort(
1330 _('ellipsis nodes require at least cg3 on client and server, '
1330 _('ellipsis nodes require at least cg3 on client and server, '
1331 'but negotiated version %s') % version)
1331 'but negotiated version %s') % version)
1332
1332
1333 # Requested files could include files not in the local store. So
1333 # Requested files could include files not in the local store. So
1334 # filter those out.
1334 # filter those out.
1335 filematcher = matchmod.intersectmatchers(repo.narrowmatch(),
1335 filematcher = matchmod.intersectmatchers(repo.narrowmatch(),
1336 filematcher)
1336 filematcher)
1337
1337
1338 fn = _packermap[version][0]
1338 fn = _packermap[version][0]
1339 return fn(repo, filematcher, bundlecaps, ellipses=ellipses,
1339 return fn(repo, filematcher, bundlecaps, ellipses=ellipses,
1340 shallow=shallow, ellipsisroots=ellipsisroots,
1340 shallow=shallow, ellipsisroots=ellipsisroots,
1341 fullnodes=fullnodes)
1341 fullnodes=fullnodes)
1342
1342
1343 def getunbundler(version, fh, alg, extras=None):
1343 def getunbundler(version, fh, alg, extras=None):
1344 return _packermap[version][1](fh, alg, extras=extras)
1344 return _packermap[version][1](fh, alg, extras=extras)
1345
1345
1346 def _changegroupinfo(repo, nodes, source):
1346 def _changegroupinfo(repo, nodes, source):
1347 if repo.ui.verbose or source == 'bundle':
1347 if repo.ui.verbose or source == 'bundle':
1348 repo.ui.status(_("%d changesets found\n") % len(nodes))
1348 repo.ui.status(_("%d changesets found\n") % len(nodes))
1349 if repo.ui.debugflag:
1349 if repo.ui.debugflag:
1350 repo.ui.debug("list of changesets:\n")
1350 repo.ui.debug("list of changesets:\n")
1351 for node in nodes:
1351 for node in nodes:
1352 repo.ui.debug("%s\n" % hex(node))
1352 repo.ui.debug("%s\n" % hex(node))
1353
1353
1354 def makechangegroup(repo, outgoing, version, source, fastpath=False,
1354 def makechangegroup(repo, outgoing, version, source, fastpath=False,
1355 bundlecaps=None):
1355 bundlecaps=None):
1356 cgstream = makestream(repo, outgoing, version, source,
1356 cgstream = makestream(repo, outgoing, version, source,
1357 fastpath=fastpath, bundlecaps=bundlecaps)
1357 fastpath=fastpath, bundlecaps=bundlecaps)
1358 return getunbundler(version, util.chunkbuffer(cgstream), None,
1358 return getunbundler(version, util.chunkbuffer(cgstream), None,
1359 {'clcount': len(outgoing.missing) })
1359 {'clcount': len(outgoing.missing) })
1360
1360
1361 def makestream(repo, outgoing, version, source, fastpath=False,
1361 def makestream(repo, outgoing, version, source, fastpath=False,
1362 bundlecaps=None, filematcher=None):
1362 bundlecaps=None, filematcher=None):
1363 bundler = getbundler(version, repo, bundlecaps=bundlecaps,
1363 bundler = getbundler(version, repo, bundlecaps=bundlecaps,
1364 filematcher=filematcher)
1364 filematcher=filematcher)
1365
1365
1366 repo = repo.unfiltered()
1366 repo = repo.unfiltered()
1367 commonrevs = outgoing.common
1367 commonrevs = outgoing.common
1368 csets = outgoing.missing
1368 csets = outgoing.missing
1369 heads = outgoing.missingheads
1369 heads = outgoing.missingheads
1370 # We go through the fast path if we get told to, or if all (unfiltered
1370 # We go through the fast path if we get told to, or if all (unfiltered
1371 # heads have been requested (since we then know there all linkrevs will
1371 # heads have been requested (since we then know there all linkrevs will
1372 # be pulled by the client).
1372 # be pulled by the client).
1373 heads.sort()
1373 heads.sort()
1374 fastpathlinkrev = fastpath or (
1374 fastpathlinkrev = fastpath or (
1375 repo.filtername is None and heads == sorted(repo.heads()))
1375 repo.filtername is None and heads == sorted(repo.heads()))
1376
1376
1377 repo.hook('preoutgoing', throw=True, source=source)
1377 repo.hook('preoutgoing', throw=True, source=source)
1378 _changegroupinfo(repo, csets, source)
1378 _changegroupinfo(repo, csets, source)
1379 return bundler.generate(commonrevs, csets, fastpathlinkrev, source)
1379 return bundler.generate(commonrevs, csets, fastpathlinkrev, source)
1380
1380
1381 def _addchangegroupfiles(repo, source, revmap, trp, expectedfiles, needfiles):
1381 def _addchangegroupfiles(repo, source, revmap, trp, expectedfiles, needfiles):
1382 revisions = 0
1382 revisions = 0
1383 files = 0
1383 files = 0
1384 progress = repo.ui.makeprogress(_('files'), unit=_('files'),
1384 progress = repo.ui.makeprogress(_('files'), unit=_('files'),
1385 total=expectedfiles)
1385 total=expectedfiles)
1386 for chunkdata in iter(source.filelogheader, {}):
1386 for chunkdata in iter(source.filelogheader, {}):
1387 files += 1
1387 files += 1
1388 f = chunkdata["filename"]
1388 f = chunkdata["filename"]
1389 repo.ui.debug("adding %s revisions\n" % f)
1389 repo.ui.debug("adding %s revisions\n" % f)
1390 progress.increment()
1390 progress.increment()
1391 fl = repo.file(f)
1391 fl = repo.file(f)
1392 o = len(fl)
1392 o = len(fl)
1393 try:
1393 try:
1394 deltas = source.deltaiter()
1394 deltas = source.deltaiter()
1395 if not fl.addgroup(deltas, revmap, trp):
1395 if not fl.addgroup(deltas, revmap, trp):
1396 raise error.Abort(_("received file revlog group is empty"))
1396 raise error.Abort(_("received file revlog group is empty"))
1397 except error.CensoredBaseError as e:
1397 except error.CensoredBaseError as e:
1398 raise error.Abort(_("received delta base is censored: %s") % e)
1398 raise error.Abort(_("received delta base is censored: %s") % e)
1399 revisions += len(fl) - o
1399 revisions += len(fl) - o
1400 if f in needfiles:
1400 if f in needfiles:
1401 needs = needfiles[f]
1401 needs = needfiles[f]
1402 for new in pycompat.xrange(o, len(fl)):
1402 for new in pycompat.xrange(o, len(fl)):
1403 n = fl.node(new)
1403 n = fl.node(new)
1404 if n in needs:
1404 if n in needs:
1405 needs.remove(n)
1405 needs.remove(n)
1406 else:
1406 else:
1407 raise error.Abort(
1407 raise error.Abort(
1408 _("received spurious file revlog entry"))
1408 _("received spurious file revlog entry"))
1409 if not needs:
1409 if not needs:
1410 del needfiles[f]
1410 del needfiles[f]
1411 progress.complete()
1411 progress.complete()
1412
1412
1413 for f, needs in needfiles.iteritems():
1413 for f, needs in needfiles.iteritems():
1414 fl = repo.file(f)
1414 fl = repo.file(f)
1415 for n in needs:
1415 for n in needs:
1416 try:
1416 try:
1417 fl.rev(n)
1417 fl.rev(n)
1418 except error.LookupError:
1418 except error.LookupError:
1419 raise error.Abort(
1419 raise error.Abort(
1420 _('missing file data for %s:%s - run hg verify') %
1420 _('missing file data for %s:%s - run hg verify') %
1421 (f, hex(n)))
1421 (f, hex(n)))
1422
1422
1423 return revisions, files
1423 return revisions, files
General Comments 0
You need to be logged in to leave comments. Login now