##// END OF EJS Templates
changegroup: move deltaparent() from narrow...
Gregory Szorc -
r38921:5839a170 default
parent child Browse files
Show More
@@ -1,335 +1,318 b''
1 # narrowchangegroup.py - narrow clone changegroup creation and consumption
1 # narrowchangegroup.py - narrow clone changegroup creation and consumption
2 #
2 #
3 # Copyright 2017 Google, Inc.
3 # Copyright 2017 Google, Inc.
4 #
4 #
5 # This software may be used and distributed according to the terms of the
5 # This software may be used and distributed according to the terms of the
6 # GNU General Public License version 2 or any later version.
6 # GNU General Public License version 2 or any later version.
7
7
8 from __future__ import absolute_import
8 from __future__ import absolute_import
9
9
10 from mercurial.i18n import _
10 from mercurial.i18n import _
11 from mercurial import (
11 from mercurial import (
12 changegroup,
12 changegroup,
13 error,
13 error,
14 extensions,
14 extensions,
15 node,
15 node,
16 pycompat,
16 pycompat,
17 util,
17 util,
18 )
18 )
19
19
def setup():
    """Install the narrow-clone wrappers on the changegroup packers.

    Every nested function below is registered through
    extensions.wrapfunction() and therefore takes the wrapped original
    implementation as its first argument (``orig``). All wrappers target
    changegroup.cg1packer except deltaparent(), which wraps
    changegroup.cg2packer.
    """
    def generatefiles(orig, self, changedfiles, linknodes, commonrevs,
                      source):
        """Filter changed files through self._filematcher before delegating.

        When the packer is flagged ``is_shallow``, the ``linknodes``
        callback is replaced by one that also reports file nodes found in
        the manifests stashed on ``self._mfdicts`` by generate().
        """
        changedfiles = list(filter(self._filematcher, changedfiles))

        if getattr(self, 'is_shallow', False):
            # See comment in generate() for why this sadness is a thing.
            mfdicts = self._mfdicts
            del self._mfdicts
            # In a shallow clone, the linknodes callback needs to also include
            # those file nodes that are in the manifests we sent but weren't
            # introduced by those manifests.
            commonctxs = [self._repo[c] for c in commonrevs]
            oldlinknodes = linknodes
            clrev = self._repo.changelog.rev
            def linknodes(flog, fname):
                for c in commonctxs:
                    try:
                        fnode = c.filenode(fname)
                        self.clrev_to_localrev[c.rev()] = flog.rev(fnode)
                    except error.ManifestLookupError:
                        # fname is not present in this common changeset
                        pass
                links = oldlinknodes(flog, fname)
                if len(links) != len(mfdicts):
                    for mf, lr in mfdicts:
                        fnode = mf.get(fname, None)
                        if fnode in links:
                            # keep whichever linknode has the lowest
                            # changelog revision
                            links[fnode] = min(links[fnode], lr, key=clrev)
                        elif fnode:
                            links[fnode] = lr
                return links
        return orig(self, changedfiles, linknodes, commonrevs, source)
    extensions.wrapfunction(
        changegroup.cg1packer, 'generatefiles', generatefiles)

    def close(orig, self):
        """Rotate the clrev -> localrev mapping, then delegate to orig.

        The current mapping is cleared; if a non-empty
        ``next_clrev_to_localrev`` exists it becomes the current mapping.
        ``changelog_done`` is set so later revchunk() calls know the
        changelog group has been closed.
        """
        getattr(self, 'clrev_to_localrev', {}).clear()
        if getattr(self, 'next_clrev_to_localrev', {}):
            self.clrev_to_localrev = self.next_clrev_to_localrev
            del self.next_clrev_to_localrev
        self.changelog_done = True
        return orig(self)
    extensions.wrapfunction(changegroup.cg1packer, 'close', close)

    # In a perfect world, we'd generate better ellipsis-ified graphs
    # for non-changelog revlogs. In practice, we haven't started doing
    # that yet, so the resulting DAGs for the manifestlog and filelogs
    # are actually full of bogus parentage on all the ellipsis
    # nodes. This has the side effect that, while the contents are
    # correct, the individual DAGs might be completely out of whack in
    # a case like 882681bc3166 and its ancestors (back about 10
    # revisions or so) in the main hg repo.
    #
    # The one invariant we *know* holds is that the new (potentially
    # bogus) DAG shape will be valid if we order the nodes in the
    # order that they're introduced in dramatis personae by the
    # changelog, so what we do is we sort the non-changelog histories
    # by the order in which they are used by the changelog.
    def _sortgroup(orig, self, revlog, nodelist, lookup):
        """Order nodes by the changelog revision that links to them.

        Falls back to orig when the packer has no ``full_nodes``
        attribute or ``clnode_to_rev`` is empty.
        """
        if not util.safehasattr(self, 'full_nodes') or not self.clnode_to_rev:
            return orig(self, revlog, nodelist, lookup)
        key = lambda n: self.clnode_to_rev[lookup(n)]
        return [revlog.rev(n) for n in sorted(nodelist, key=key)]

    extensions.wrapfunction(changegroup.cg1packer, '_sortgroup', _sortgroup)

    def generate(orig, self, commonrevs, clnodes, fastpathlinkrev, source):
        '''yield a sequence of changegroup chunks (strings)'''
        # Note: other than delegating to orig, the only deviation in
        # logic from normal hg's generate is marked with BEGIN/END
        # NARROW HACK.
        if not util.safehasattr(self, 'full_nodes'):
            # not sending a narrow bundle
            for x in orig(self, commonrevs, clnodes, fastpathlinkrev, source):
                yield x
            return

        repo = self._repo
        cl = repo.changelog
        mfl = repo.manifestlog
        mfrevlog = mfl._revlog

        clrevorder = {}
        mfs = {} # needed manifests
        fnodes = {} # needed file nodes
        changedfiles = set()

        # Callback for the changelog, used to collect changed files and manifest
        # nodes.
        # Returns the linkrev node (identity in the changelog case).
        def lookupcl(x):
            c = cl.read(x)
            clrevorder[x] = len(clrevorder)
            # BEGIN NARROW HACK
            #
            # Only update mfs if x is going to be sent. Otherwise we
            # end up with bogus linkrevs specified for manifests and
            # we skip some manifest nodes that we should otherwise
            # have sent.
            if x in self.full_nodes or cl.rev(x) in self.precomputed_ellipsis:
                n = c[0]
                # record the first changeset introducing this manifest version
                mfs.setdefault(n, x)
                # Set this narrow-specific dict so we have the lowest manifest
                # revnum to look up for this cl revnum. (Part of mapping
                # changelog ellipsis parents to manifest ellipsis parents)
                self.next_clrev_to_localrev.setdefault(cl.rev(x),
                                                       mfrevlog.rev(n))
            # We can't trust the changed files list in the changeset if the
            # client requested a shallow clone.
            if self.is_shallow:
                changedfiles.update(mfl[c[0]].read().keys())
            else:
                changedfiles.update(c[3])
            # END NARROW HACK
            # Record a complete list of potentially-changed files in
            # this manifest.
            return x

        self._verbosenote(_('uncompressed size of bundle content:\n'))
        size = 0
        for chunk in self.group(clnodes, cl, lookupcl, units=_('changesets')):
            size += len(chunk)
            yield chunk
        self._verbosenote(_('%8.i (changelog)\n') % size)

        # We need to make sure that the linkrev in the changegroup refers to
        # the first changeset that introduced the manifest or file revision.
        # The fastpath is usually safer than the slowpath, because the filelogs
        # are walked in revlog order.
        #
        # When taking the slowpath with reorder=None and the manifest revlog
        # uses generaldelta, the manifest may be walked in the "wrong" order.
        # Without 'clrevorder', we would get an incorrect linkrev (see fix in
        # cc0ff93d0c0c).
        #
        # When taking the fastpath, we are only vulnerable to reordering
        # of the changelog itself. The changelog never uses generaldelta, so
        # it is only reordered when reorder=True. To handle this case, we
        # simply take the slowpath, which already has the 'clrevorder' logic.
        # This was also fixed in cc0ff93d0c0c.
        fastpathlinkrev = fastpathlinkrev and not self._reorder
        # Treemanifests don't work correctly with fastpathlinkrev
        # either, because we don't discover which directory nodes to
        # send along with files. This could probably be fixed.
        fastpathlinkrev = fastpathlinkrev and (
            'treemanifest' not in repo.requirements)
        # Shallow clones also don't work correctly with fastpathlinkrev
        # because file nodes may need to be sent for a manifest even if they
        # weren't introduced by that manifest.
        fastpathlinkrev = fastpathlinkrev and not self.is_shallow

        for chunk in self.generatemanifests(commonrevs, clrevorder,
                                            fastpathlinkrev, mfs, fnodes,
                                            source):
            yield chunk
        # BEGIN NARROW HACK
        mfdicts = None
        if self.is_shallow:
            mfdicts = [(self._repo.manifestlog[n].read(), lr)
                       for (n, lr) in mfs.iteritems()]
        # END NARROW HACK
        mfs.clear()
        clrevs = set(cl.rev(x) for x in clnodes)

        if not fastpathlinkrev:
            def linknodes(unused, fname):
                return fnodes.get(fname, {})
        else:
            cln = cl.node
            def linknodes(filerevlog, fname):
                llr = filerevlog.linkrev
                fln = filerevlog.node
                revs = ((r, llr(r)) for r in filerevlog)
                return dict((fln(r), cln(lr)) for r, lr in revs if lr in clrevs)

        # BEGIN NARROW HACK
        #
        # We need to pass the mfdicts variable down into
        # generatefiles(), but more than one command might have
        # wrapped generatefiles so we can't modify the function
        # signature. Instead, we pass the data to ourselves using an
        # instance attribute. I'm sorry.
        self._mfdicts = mfdicts
        # END NARROW HACK
        for chunk in self.generatefiles(changedfiles, linknodes, commonrevs,
                                        source):
            yield chunk

        yield self.close()

        if clnodes:
            repo.hook('outgoing', node=node.hex(clnodes[0]), source=source)
    extensions.wrapfunction(changegroup.cg1packer, 'generate', generate)

    def revchunk(orig, self, revlog, rev, prev, linknode):
        """Yield the chunk(s) for ``rev``, as full data or as an ellipsis.

        Delegates to orig for non-narrow packers and for revisions whose
        linknode is in ``self.full_nodes``. Revisions whose linkrev is not
        in ``self.precomputed_ellipsis`` yield nothing. Everything else is
        emitted through changegroup.ellipsisdata() with parents remapped
        by the nested local() helper.
        """
        if not util.safehasattr(self, 'full_nodes'):
            # not sending a narrow changegroup
            for x in orig(self, revlog, rev, prev, linknode):
                yield x
            return
        # build up some mapping information that's useful later. See
        # the local() nested function below.
        if not self.changelog_done:
            self.clnode_to_rev[linknode] = rev
            linkrev = rev
            self.clrev_to_localrev[linkrev] = rev
        else:
            linkrev = self.clnode_to_rev[linknode]
            self.clrev_to_localrev[linkrev] = rev
        # This is a node to send in full, because the changeset it
        # corresponds to was a full changeset.
        if linknode in self.full_nodes:
            for x in orig(self, revlog, rev, prev, linknode):
                yield x
            return
        # At this point, a node can either be one we should skip or an
        # ellipsis. If it's not an ellipsis, bail immediately.
        if linkrev not in self.precomputed_ellipsis:
            return
        linkparents = self.precomputed_ellipsis[linkrev]
        def local(clrev):
            """Turn a changelog revnum into a local revnum.

            The ellipsis dag is stored as revnums on the changelog,
            but when we're producing ellipsis entries for
            non-changelog revlogs, we need to turn those numbers into
            something local. This does that for us, and during the
            changelog sending phase will also expand the stored
            mappings as needed.
            """
            if clrev == node.nullrev:
                return node.nullrev
            if not self.changelog_done:
                # If we're doing the changelog, it's possible that we
                # have a parent that is already on the client, and we
                # need to store some extra mapping information so that
                # our contained ellipsis nodes will be able to resolve
                # their parents.
                if clrev not in self.clrev_to_localrev:
                    clnode = revlog.node(clrev)
                    self.clnode_to_rev[clnode] = clrev
                return clrev
            # Walk the ellipsis-ized changelog breadth-first looking for a
            # change that has been linked from the current revlog.
            #
            # For a flat manifest revlog only a single step should be necessary
            # as all relevant changelog entries are relevant to the flat
            # manifest.
            #
            # For a filelog or tree manifest dirlog however not every changelog
            # entry will have been relevant, so we need to skip some changelog
            # nodes even after ellipsis-izing.
            walk = [clrev]
            while walk:
                p = walk[0]
                walk = walk[1:]
                if p in self.clrev_to_localrev:
                    return self.clrev_to_localrev[p]
                elif p in self.full_nodes:
                    walk.extend([pp for pp in self._repo.changelog.parentrevs(p)
                                 if pp != node.nullrev])
                elif p in self.precomputed_ellipsis:
                    walk.extend([pp for pp in self.precomputed_ellipsis[p]
                                 if pp != node.nullrev])
                else:
                    # In this case, we've got an ellipsis with parents
                    # outside the current bundle (likely an
                    # incremental pull). We "know" that we can use the
                    # value of this same revlog at whatever revision
                    # is pointed to by linknode. "Know" is in scare
                    # quotes because I haven't done enough examination
                    # of edge cases to convince myself this is really
                    # a fact - it works for all the (admittedly
                    # thorough) cases in our testsuite, but I would be
                    # somewhat unsurprised to find a case in the wild
                    # where this breaks down a bit. That said, I don't
                    # know if it would hurt anything.
                    #
                    # NOTE(review): the range below stops before 0, so
                    # revision 0 of this revlog is never examined -
                    # confirm that is intended.
                    for i in pycompat.xrange(rev, 0, -1):
                        if revlog.linkrev(i) == clrev:
                            return i
                    # We failed to resolve a parent for this node, so
                    # we crash the changegroup construction.
                    raise error.Abort(
                        'unable to resolve parent while packing %r %r'
                        ' for changeset %r' % (revlog.indexfile, rev, clrev))
            return node.nullrev

        if not linkparents or (
            revlog.parentrevs(rev) == (node.nullrev, node.nullrev)):
            p1, p2 = node.nullrev, node.nullrev
        elif len(linkparents) == 1:
            p1, = sorted(local(p) for p in linkparents)
            p2 = node.nullrev
        else:
            p1, p2 = sorted(local(p) for p in linkparents)
        n = revlog.node(rev)
        yield changegroup.ellipsisdata(
            self, rev, revlog, p1, p2, revlog.revision(n), linknode)
    extensions.wrapfunction(changegroup.cg1packer, 'revchunk', revchunk)

    def deltaparent(orig, self, revlog, rev, p1, p2, prev):
        """Use p1 as the delta base whenever the packer is in narrow mode."""
        if util.safehasattr(self, 'full_nodes'):
            # TODO: send better deltas when in narrow mode.
            #
            # changegroup.group() loops over revisions to send,
            # including revisions we'll skip. What this means is that
            # `prev` will be a potentially useless delta base for all
            # ellipsis nodes, as the client likely won't have it. In
            # the future we should do bookkeeping about which nodes
            # have been sent to the client, and try to be
            # significantly smarter about delta bases. This is
            # slightly tricky because this same code has to work for
            # all revlogs, and we don't have the linkrev/linknode here.
            return p1
        return orig(self, revlog, rev, p1, p2, prev)
    extensions.wrapfunction(changegroup.cg2packer, 'deltaparent', deltaparent)
@@ -1,1090 +1,1105 b''
1 # changegroup.py - Mercurial changegroup manipulation functions
1 # changegroup.py - Mercurial changegroup manipulation functions
2 #
2 #
3 # Copyright 2006 Matt Mackall <mpm@selenic.com>
3 # Copyright 2006 Matt Mackall <mpm@selenic.com>
4 #
4 #
5 # This software may be used and distributed according to the terms of the
5 # This software may be used and distributed according to the terms of the
6 # GNU General Public License version 2 or any later version.
6 # GNU General Public License version 2 or any later version.
7
7
8 from __future__ import absolute_import
8 from __future__ import absolute_import
9
9
10 import os
10 import os
11 import struct
11 import struct
12 import weakref
12 import weakref
13
13
14 from .i18n import _
14 from .i18n import _
15 from .node import (
15 from .node import (
16 hex,
16 hex,
17 nullid,
17 nullid,
18 nullrev,
18 nullrev,
19 short,
19 short,
20 )
20 )
21
21
22 from . import (
22 from . import (
23 dagutil,
23 dagutil,
24 error,
24 error,
25 manifest,
25 manifest,
26 match as matchmod,
26 match as matchmod,
27 mdiff,
27 mdiff,
28 phases,
28 phases,
29 pycompat,
29 pycompat,
30 repository,
30 repository,
31 revlog,
31 revlog,
32 util,
32 util,
33 )
33 )
34
34
35 from .utils import (
35 from .utils import (
36 stringutil,
36 stringutil,
37 )
37 )
38
38
# struct format strings for the per-revision delta header of each
# changegroup version (fed to struct.calcsize() by the unpacker classes).
_CHANGEGROUPV1_DELTA_HEADER = "20s20s20s20s"
_CHANGEGROUPV2_DELTA_HEADER = "20s20s20s20s20s"
_CHANGEGROUPV3_DELTA_HEADER = ">20s20s20s20s20sH"

LFS_REQUIREMENT = 'lfs'

# module-level alias so the chunk readers can call it directly
readexactly = util.readexactly
46
46
def getchunk(stream):
    """return the next chunk from stream as a string

    A chunk is framed by a 4-byte big-endian signed length (">l") that
    counts the length field itself. A length of 0 marks an empty chunk
    and yields ""; any other length <= 4 raises error.Abort.
    """
    d = readexactly(stream, 4)
    l = struct.unpack(">l", d)[0]
    if l <= 4:
        if l:
            raise error.Abort(_("invalid chunk length %d") % l)
        return ""
    # the encoded length includes the 4 header bytes already consumed
    return readexactly(stream, l - 4)
56
56
def chunkheader(length):
    """return a changegroup chunk header (string)

    ``length`` is the payload size; the encoded value is ``length + 4``
    because the 4-byte header counts itself.
    """
    return struct.pack(">l", length + 4)
60
60
def closechunk():
    """return a changegroup chunk header (string) for a zero-length chunk"""
    # A literal 0 (not 4): getchunk() treats a zero length as "empty chunk".
    return struct.pack(">l", 0)
64
64
def writechunks(ui, chunks, filename, vfs=None):
    """Write chunks to a file and return its filename.

    The stream is assumed to be a bundle file.
    Existing files will not be overwritten.
    If no filename is specified, a temporary file is created.

    ``ui`` is accepted but not used here. ``chunks`` is any iterable of
    data accepted by the file object's write(). When ``vfs`` is given
    together with ``filename``, the file is opened (and, on failure,
    unlinked) through it.

    If writing fails part-way, the partially written file is removed
    before the exception propagates.

    NOTE(review): the non-vfs path opens ``filename`` with mode "wb",
    which truncates an existing file - confirm the "will not be
    overwritten" statement above.
    """
    fh = None
    cleanup = None
    try:
        if filename:
            if vfs:
                fh = vfs.open(filename, "wb")
            else:
                # Increase default buffer size because default is usually
                # small (4k is common on Linux).
                fh = open(filename, "wb", 131072)
        else:
            fd, filename = pycompat.mkstemp(prefix="hg-bundle-", suffix=".hg")
            fh = os.fdopen(fd, r"wb")
        # from here on a failure must remove the (partial) file
        cleanup = filename
        for c in chunks:
            fh.write(c)
        # success: keep the file
        cleanup = None
        return filename
    finally:
        if fh is not None:
            fh.close()
        if cleanup is not None:
            if filename and vfs:
                vfs.unlink(cleanup)
            else:
                os.unlink(cleanup)
98
98
99 class cg1unpacker(object):
99 class cg1unpacker(object):
100 """Unpacker for cg1 changegroup streams.
100 """Unpacker for cg1 changegroup streams.
101
101
102 A changegroup unpacker handles the framing of the revision data in
102 A changegroup unpacker handles the framing of the revision data in
103 the wire format. Most consumers will want to use the apply()
103 the wire format. Most consumers will want to use the apply()
104 method to add the changes from the changegroup to a repository.
104 method to add the changes from the changegroup to a repository.
105
105
106 If you're forwarding a changegroup unmodified to another consumer,
106 If you're forwarding a changegroup unmodified to another consumer,
107 use getchunks(), which returns an iterator of changegroup
107 use getchunks(), which returns an iterator of changegroup
108 chunks. This is mostly useful for cases where you need to know the
108 chunks. This is mostly useful for cases where you need to know the
109 data stream has ended by observing the end of the changegroup.
109 data stream has ended by observing the end of the changegroup.
110
110
111 deltachunk() is useful only if you're applying delta data. Most
111 deltachunk() is useful only if you're applying delta data. Most
112 consumers should prefer apply() instead.
112 consumers should prefer apply() instead.
113
113
114 A few other public methods exist. Those are used only for
114 A few other public methods exist. Those are used only for
115 bundlerepo and some debug commands - their use is discouraged.
115 bundlerepo and some debug commands - their use is discouraged.
116 """
116 """
117 deltaheader = _CHANGEGROUPV1_DELTA_HEADER
117 deltaheader = _CHANGEGROUPV1_DELTA_HEADER
118 deltaheadersize = struct.calcsize(deltaheader)
118 deltaheadersize = struct.calcsize(deltaheader)
119 version = '01'
119 version = '01'
120 _grouplistcount = 1 # One list of files after the manifests
120 _grouplistcount = 1 # One list of files after the manifests
121
121
122 def __init__(self, fh, alg, extras=None):
122 def __init__(self, fh, alg, extras=None):
123 if alg is None:
123 if alg is None:
124 alg = 'UN'
124 alg = 'UN'
125 if alg not in util.compengines.supportedbundletypes:
125 if alg not in util.compengines.supportedbundletypes:
126 raise error.Abort(_('unknown stream compression type: %s')
126 raise error.Abort(_('unknown stream compression type: %s')
127 % alg)
127 % alg)
128 if alg == 'BZ':
128 if alg == 'BZ':
129 alg = '_truncatedBZ'
129 alg = '_truncatedBZ'
130
130
131 compengine = util.compengines.forbundletype(alg)
131 compengine = util.compengines.forbundletype(alg)
132 self._stream = compengine.decompressorreader(fh)
132 self._stream = compengine.decompressorreader(fh)
133 self._type = alg
133 self._type = alg
134 self.extras = extras or {}
134 self.extras = extras or {}
135 self.callback = None
135 self.callback = None
136
136
137 # These methods (compressed, read, seek, tell) all appear to only
137 # These methods (compressed, read, seek, tell) all appear to only
138 # be used by bundlerepo, but it's a little hard to tell.
138 # be used by bundlerepo, but it's a little hard to tell.
139 def compressed(self):
139 def compressed(self):
140 return self._type is not None and self._type != 'UN'
140 return self._type is not None and self._type != 'UN'
141 def read(self, l):
141 def read(self, l):
142 return self._stream.read(l)
142 return self._stream.read(l)
143 def seek(self, pos):
143 def seek(self, pos):
144 return self._stream.seek(pos)
144 return self._stream.seek(pos)
145 def tell(self):
145 def tell(self):
146 return self._stream.tell()
146 return self._stream.tell()
147 def close(self):
147 def close(self):
148 return self._stream.close()
148 return self._stream.close()
149
149
150 def _chunklength(self):
150 def _chunklength(self):
151 d = readexactly(self._stream, 4)
151 d = readexactly(self._stream, 4)
152 l = struct.unpack(">l", d)[0]
152 l = struct.unpack(">l", d)[0]
153 if l <= 4:
153 if l <= 4:
154 if l:
154 if l:
155 raise error.Abort(_("invalid chunk length %d") % l)
155 raise error.Abort(_("invalid chunk length %d") % l)
156 return 0
156 return 0
157 if self.callback:
157 if self.callback:
158 self.callback()
158 self.callback()
159 return l - 4
159 return l - 4
160
160
161 def changelogheader(self):
161 def changelogheader(self):
162 """v10 does not have a changelog header chunk"""
162 """v10 does not have a changelog header chunk"""
163 return {}
163 return {}
164
164
165 def manifestheader(self):
165 def manifestheader(self):
166 """v10 does not have a manifest header chunk"""
166 """v10 does not have a manifest header chunk"""
167 return {}
167 return {}
168
168
169 def filelogheader(self):
169 def filelogheader(self):
170 """return the header of the filelogs chunk, v10 only has the filename"""
170 """return the header of the filelogs chunk, v10 only has the filename"""
171 l = self._chunklength()
171 l = self._chunklength()
172 if not l:
172 if not l:
173 return {}
173 return {}
174 fname = readexactly(self._stream, l)
174 fname = readexactly(self._stream, l)
175 return {'filename': fname}
175 return {'filename': fname}
176
176
177 def _deltaheader(self, headertuple, prevnode):
177 def _deltaheader(self, headertuple, prevnode):
178 node, p1, p2, cs = headertuple
178 node, p1, p2, cs = headertuple
179 if prevnode is None:
179 if prevnode is None:
180 deltabase = p1
180 deltabase = p1
181 else:
181 else:
182 deltabase = prevnode
182 deltabase = prevnode
183 flags = 0
183 flags = 0
184 return node, p1, p2, deltabase, cs, flags
184 return node, p1, p2, deltabase, cs, flags
185
185
186 def deltachunk(self, prevnode):
186 def deltachunk(self, prevnode):
187 l = self._chunklength()
187 l = self._chunklength()
188 if not l:
188 if not l:
189 return {}
189 return {}
190 headerdata = readexactly(self._stream, self.deltaheadersize)
190 headerdata = readexactly(self._stream, self.deltaheadersize)
191 header = struct.unpack(self.deltaheader, headerdata)
191 header = struct.unpack(self.deltaheader, headerdata)
192 delta = readexactly(self._stream, l - self.deltaheadersize)
192 delta = readexactly(self._stream, l - self.deltaheadersize)
193 node, p1, p2, deltabase, cs, flags = self._deltaheader(header, prevnode)
193 node, p1, p2, deltabase, cs, flags = self._deltaheader(header, prevnode)
194 return (node, p1, p2, cs, deltabase, delta, flags)
194 return (node, p1, p2, cs, deltabase, delta, flags)
195
195
196 def getchunks(self):
196 def getchunks(self):
197 """returns all the chunks contains in the bundle
197 """returns all the chunks contains in the bundle
198
198
199 Used when you need to forward the binary stream to a file or another
199 Used when you need to forward the binary stream to a file or another
200 network API. To do so, it parse the changegroup data, otherwise it will
200 network API. To do so, it parse the changegroup data, otherwise it will
201 block in case of sshrepo because it don't know the end of the stream.
201 block in case of sshrepo because it don't know the end of the stream.
202 """
202 """
203 # For changegroup 1 and 2, we expect 3 parts: changelog, manifestlog,
203 # For changegroup 1 and 2, we expect 3 parts: changelog, manifestlog,
204 # and a list of filelogs. For changegroup 3, we expect 4 parts:
204 # and a list of filelogs. For changegroup 3, we expect 4 parts:
205 # changelog, manifestlog, a list of tree manifestlogs, and a list of
205 # changelog, manifestlog, a list of tree manifestlogs, and a list of
206 # filelogs.
206 # filelogs.
207 #
207 #
208 # Changelog and manifestlog parts are terminated with empty chunks. The
208 # Changelog and manifestlog parts are terminated with empty chunks. The
209 # tree and file parts are a list of entry sections. Each entry section
209 # tree and file parts are a list of entry sections. Each entry section
210 # is a series of chunks terminating in an empty chunk. The list of these
210 # is a series of chunks terminating in an empty chunk. The list of these
211 # entry sections is terminated in yet another empty chunk, so we know
211 # entry sections is terminated in yet another empty chunk, so we know
212 # we've reached the end of the tree/file list when we reach an empty
212 # we've reached the end of the tree/file list when we reach an empty
213 # chunk that was proceeded by no non-empty chunks.
213 # chunk that was proceeded by no non-empty chunks.
214
214
215 parts = 0
215 parts = 0
216 while parts < 2 + self._grouplistcount:
216 while parts < 2 + self._grouplistcount:
217 noentries = True
217 noentries = True
218 while True:
218 while True:
219 chunk = getchunk(self)
219 chunk = getchunk(self)
220 if not chunk:
220 if not chunk:
221 # The first two empty chunks represent the end of the
221 # The first two empty chunks represent the end of the
222 # changelog and the manifestlog portions. The remaining
222 # changelog and the manifestlog portions. The remaining
223 # empty chunks represent either A) the end of individual
223 # empty chunks represent either A) the end of individual
224 # tree or file entries in the file list, or B) the end of
224 # tree or file entries in the file list, or B) the end of
225 # the entire list. It's the end of the entire list if there
225 # the entire list. It's the end of the entire list if there
226 # were no entries (i.e. noentries is True).
226 # were no entries (i.e. noentries is True).
227 if parts < 2:
227 if parts < 2:
228 parts += 1
228 parts += 1
229 elif noentries:
229 elif noentries:
230 parts += 1
230 parts += 1
231 break
231 break
232 noentries = False
232 noentries = False
233 yield chunkheader(len(chunk))
233 yield chunkheader(len(chunk))
234 pos = 0
234 pos = 0
235 while pos < len(chunk):
235 while pos < len(chunk):
236 next = pos + 2**20
236 next = pos + 2**20
237 yield chunk[pos:next]
237 yield chunk[pos:next]
238 pos = next
238 pos = next
239 yield closechunk()
239 yield closechunk()
240
240
241 def _unpackmanifests(self, repo, revmap, trp, prog):
241 def _unpackmanifests(self, repo, revmap, trp, prog):
242 self.callback = prog.increment
242 self.callback = prog.increment
243 # no need to check for empty manifest group here:
243 # no need to check for empty manifest group here:
244 # if the result of the merge of 1 and 2 is the same in 3 and 4,
244 # if the result of the merge of 1 and 2 is the same in 3 and 4,
245 # no new manifest will be created and the manifest group will
245 # no new manifest will be created and the manifest group will
246 # be empty during the pull
246 # be empty during the pull
247 self.manifestheader()
247 self.manifestheader()
248 deltas = self.deltaiter()
248 deltas = self.deltaiter()
249 repo.manifestlog.addgroup(deltas, revmap, trp)
249 repo.manifestlog.addgroup(deltas, revmap, trp)
250 prog.complete()
250 prog.complete()
251 self.callback = None
251 self.callback = None
252
252
253 def apply(self, repo, tr, srctype, url, targetphase=phases.draft,
253 def apply(self, repo, tr, srctype, url, targetphase=phases.draft,
254 expectedtotal=None):
254 expectedtotal=None):
255 """Add the changegroup returned by source.read() to this repo.
255 """Add the changegroup returned by source.read() to this repo.
256 srctype is a string like 'push', 'pull', or 'unbundle'. url is
256 srctype is a string like 'push', 'pull', or 'unbundle'. url is
257 the URL of the repo where this changegroup is coming from.
257 the URL of the repo where this changegroup is coming from.
258
258
259 Return an integer summarizing the change to this repo:
259 Return an integer summarizing the change to this repo:
260 - nothing changed or no source: 0
260 - nothing changed or no source: 0
261 - more heads than before: 1+added heads (2..n)
261 - more heads than before: 1+added heads (2..n)
262 - fewer heads than before: -1-removed heads (-2..-n)
262 - fewer heads than before: -1-removed heads (-2..-n)
263 - number of heads stays the same: 1
263 - number of heads stays the same: 1
264 """
264 """
265 repo = repo.unfiltered()
265 repo = repo.unfiltered()
266 def csmap(x):
266 def csmap(x):
267 repo.ui.debug("add changeset %s\n" % short(x))
267 repo.ui.debug("add changeset %s\n" % short(x))
268 return len(cl)
268 return len(cl)
269
269
270 def revmap(x):
270 def revmap(x):
271 return cl.rev(x)
271 return cl.rev(x)
272
272
273 changesets = files = revisions = 0
273 changesets = files = revisions = 0
274
274
275 try:
275 try:
276 # The transaction may already carry source information. In this
276 # The transaction may already carry source information. In this
277 # case we use the top level data. We overwrite the argument
277 # case we use the top level data. We overwrite the argument
278 # because we need to use the top level value (if they exist)
278 # because we need to use the top level value (if they exist)
279 # in this function.
279 # in this function.
280 srctype = tr.hookargs.setdefault('source', srctype)
280 srctype = tr.hookargs.setdefault('source', srctype)
281 url = tr.hookargs.setdefault('url', url)
281 url = tr.hookargs.setdefault('url', url)
282 repo.hook('prechangegroup',
282 repo.hook('prechangegroup',
283 throw=True, **pycompat.strkwargs(tr.hookargs))
283 throw=True, **pycompat.strkwargs(tr.hookargs))
284
284
285 # write changelog data to temp files so concurrent readers
285 # write changelog data to temp files so concurrent readers
286 # will not see an inconsistent view
286 # will not see an inconsistent view
287 cl = repo.changelog
287 cl = repo.changelog
288 cl.delayupdate(tr)
288 cl.delayupdate(tr)
289 oldheads = set(cl.heads())
289 oldheads = set(cl.heads())
290
290
291 trp = weakref.proxy(tr)
291 trp = weakref.proxy(tr)
292 # pull off the changeset group
292 # pull off the changeset group
293 repo.ui.status(_("adding changesets\n"))
293 repo.ui.status(_("adding changesets\n"))
294 clstart = len(cl)
294 clstart = len(cl)
295 progress = repo.ui.makeprogress(_('changesets'), unit=_('chunks'),
295 progress = repo.ui.makeprogress(_('changesets'), unit=_('chunks'),
296 total=expectedtotal)
296 total=expectedtotal)
297 self.callback = progress.increment
297 self.callback = progress.increment
298
298
299 efiles = set()
299 efiles = set()
300 def onchangelog(cl, node):
300 def onchangelog(cl, node):
301 efiles.update(cl.readfiles(node))
301 efiles.update(cl.readfiles(node))
302
302
303 self.changelogheader()
303 self.changelogheader()
304 deltas = self.deltaiter()
304 deltas = self.deltaiter()
305 cgnodes = cl.addgroup(deltas, csmap, trp, addrevisioncb=onchangelog)
305 cgnodes = cl.addgroup(deltas, csmap, trp, addrevisioncb=onchangelog)
306 efiles = len(efiles)
306 efiles = len(efiles)
307
307
308 if not cgnodes:
308 if not cgnodes:
309 repo.ui.develwarn('applied empty changegroup',
309 repo.ui.develwarn('applied empty changegroup',
310 config='warn-empty-changegroup')
310 config='warn-empty-changegroup')
311 clend = len(cl)
311 clend = len(cl)
312 changesets = clend - clstart
312 changesets = clend - clstart
313 progress.complete()
313 progress.complete()
314 self.callback = None
314 self.callback = None
315
315
316 # pull off the manifest group
316 # pull off the manifest group
317 repo.ui.status(_("adding manifests\n"))
317 repo.ui.status(_("adding manifests\n"))
318 # We know that we'll never have more manifests than we had
318 # We know that we'll never have more manifests than we had
319 # changesets.
319 # changesets.
320 progress = repo.ui.makeprogress(_('manifests'), unit=_('chunks'),
320 progress = repo.ui.makeprogress(_('manifests'), unit=_('chunks'),
321 total=changesets)
321 total=changesets)
322 self._unpackmanifests(repo, revmap, trp, progress)
322 self._unpackmanifests(repo, revmap, trp, progress)
323
323
324 needfiles = {}
324 needfiles = {}
325 if repo.ui.configbool('server', 'validate'):
325 if repo.ui.configbool('server', 'validate'):
326 cl = repo.changelog
326 cl = repo.changelog
327 ml = repo.manifestlog
327 ml = repo.manifestlog
328 # validate incoming csets have their manifests
328 # validate incoming csets have their manifests
329 for cset in pycompat.xrange(clstart, clend):
329 for cset in pycompat.xrange(clstart, clend):
330 mfnode = cl.changelogrevision(cset).manifest
330 mfnode = cl.changelogrevision(cset).manifest
331 mfest = ml[mfnode].readdelta()
331 mfest = ml[mfnode].readdelta()
332 # store file cgnodes we must see
332 # store file cgnodes we must see
333 for f, n in mfest.iteritems():
333 for f, n in mfest.iteritems():
334 needfiles.setdefault(f, set()).add(n)
334 needfiles.setdefault(f, set()).add(n)
335
335
336 # process the files
336 # process the files
337 repo.ui.status(_("adding file changes\n"))
337 repo.ui.status(_("adding file changes\n"))
338 newrevs, newfiles = _addchangegroupfiles(
338 newrevs, newfiles = _addchangegroupfiles(
339 repo, self, revmap, trp, efiles, needfiles)
339 repo, self, revmap, trp, efiles, needfiles)
340 revisions += newrevs
340 revisions += newrevs
341 files += newfiles
341 files += newfiles
342
342
343 deltaheads = 0
343 deltaheads = 0
344 if oldheads:
344 if oldheads:
345 heads = cl.heads()
345 heads = cl.heads()
346 deltaheads = len(heads) - len(oldheads)
346 deltaheads = len(heads) - len(oldheads)
347 for h in heads:
347 for h in heads:
348 if h not in oldheads and repo[h].closesbranch():
348 if h not in oldheads and repo[h].closesbranch():
349 deltaheads -= 1
349 deltaheads -= 1
350 htext = ""
350 htext = ""
351 if deltaheads:
351 if deltaheads:
352 htext = _(" (%+d heads)") % deltaheads
352 htext = _(" (%+d heads)") % deltaheads
353
353
354 repo.ui.status(_("added %d changesets"
354 repo.ui.status(_("added %d changesets"
355 " with %d changes to %d files%s\n")
355 " with %d changes to %d files%s\n")
356 % (changesets, revisions, files, htext))
356 % (changesets, revisions, files, htext))
357 repo.invalidatevolatilesets()
357 repo.invalidatevolatilesets()
358
358
359 if changesets > 0:
359 if changesets > 0:
360 if 'node' not in tr.hookargs:
360 if 'node' not in tr.hookargs:
361 tr.hookargs['node'] = hex(cl.node(clstart))
361 tr.hookargs['node'] = hex(cl.node(clstart))
362 tr.hookargs['node_last'] = hex(cl.node(clend - 1))
362 tr.hookargs['node_last'] = hex(cl.node(clend - 1))
363 hookargs = dict(tr.hookargs)
363 hookargs = dict(tr.hookargs)
364 else:
364 else:
365 hookargs = dict(tr.hookargs)
365 hookargs = dict(tr.hookargs)
366 hookargs['node'] = hex(cl.node(clstart))
366 hookargs['node'] = hex(cl.node(clstart))
367 hookargs['node_last'] = hex(cl.node(clend - 1))
367 hookargs['node_last'] = hex(cl.node(clend - 1))
368 repo.hook('pretxnchangegroup',
368 repo.hook('pretxnchangegroup',
369 throw=True, **pycompat.strkwargs(hookargs))
369 throw=True, **pycompat.strkwargs(hookargs))
370
370
371 added = [cl.node(r) for r in pycompat.xrange(clstart, clend)]
371 added = [cl.node(r) for r in pycompat.xrange(clstart, clend)]
372 phaseall = None
372 phaseall = None
373 if srctype in ('push', 'serve'):
373 if srctype in ('push', 'serve'):
374 # Old servers can not push the boundary themselves.
374 # Old servers can not push the boundary themselves.
375 # New servers won't push the boundary if changeset already
375 # New servers won't push the boundary if changeset already
376 # exists locally as secret
376 # exists locally as secret
377 #
377 #
378 # We should not use added here but the list of all change in
378 # We should not use added here but the list of all change in
379 # the bundle
379 # the bundle
380 if repo.publishing():
380 if repo.publishing():
381 targetphase = phaseall = phases.public
381 targetphase = phaseall = phases.public
382 else:
382 else:
383 # closer target phase computation
383 # closer target phase computation
384
384
385 # Those changesets have been pushed from the
385 # Those changesets have been pushed from the
386 # outside, their phases are going to be pushed
386 # outside, their phases are going to be pushed
387 # alongside. Therefor `targetphase` is
387 # alongside. Therefor `targetphase` is
388 # ignored.
388 # ignored.
389 targetphase = phaseall = phases.draft
389 targetphase = phaseall = phases.draft
390 if added:
390 if added:
391 phases.registernew(repo, tr, targetphase, added)
391 phases.registernew(repo, tr, targetphase, added)
392 if phaseall is not None:
392 if phaseall is not None:
393 phases.advanceboundary(repo, tr, phaseall, cgnodes)
393 phases.advanceboundary(repo, tr, phaseall, cgnodes)
394
394
395 if changesets > 0:
395 if changesets > 0:
396
396
397 def runhooks():
397 def runhooks():
398 # These hooks run when the lock releases, not when the
398 # These hooks run when the lock releases, not when the
399 # transaction closes. So it's possible for the changelog
399 # transaction closes. So it's possible for the changelog
400 # to have changed since we last saw it.
400 # to have changed since we last saw it.
401 if clstart >= len(repo):
401 if clstart >= len(repo):
402 return
402 return
403
403
404 repo.hook("changegroup", **pycompat.strkwargs(hookargs))
404 repo.hook("changegroup", **pycompat.strkwargs(hookargs))
405
405
406 for n in added:
406 for n in added:
407 args = hookargs.copy()
407 args = hookargs.copy()
408 args['node'] = hex(n)
408 args['node'] = hex(n)
409 del args['node_last']
409 del args['node_last']
410 repo.hook("incoming", **pycompat.strkwargs(args))
410 repo.hook("incoming", **pycompat.strkwargs(args))
411
411
412 newheads = [h for h in repo.heads()
412 newheads = [h for h in repo.heads()
413 if h not in oldheads]
413 if h not in oldheads]
414 repo.ui.log("incoming",
414 repo.ui.log("incoming",
415 "%d incoming changes - new heads: %s\n",
415 "%d incoming changes - new heads: %s\n",
416 len(added),
416 len(added),
417 ', '.join([hex(c[:6]) for c in newheads]))
417 ', '.join([hex(c[:6]) for c in newheads]))
418
418
419 tr.addpostclose('changegroup-runhooks-%020i' % clstart,
419 tr.addpostclose('changegroup-runhooks-%020i' % clstart,
420 lambda tr: repo._afterlock(runhooks))
420 lambda tr: repo._afterlock(runhooks))
421 finally:
421 finally:
422 repo.ui.flush()
422 repo.ui.flush()
423 # never return 0 here:
423 # never return 0 here:
424 if deltaheads < 0:
424 if deltaheads < 0:
425 ret = deltaheads - 1
425 ret = deltaheads - 1
426 else:
426 else:
427 ret = deltaheads + 1
427 ret = deltaheads + 1
428 return ret
428 return ret
429
429
430 def deltaiter(self):
430 def deltaiter(self):
431 """
431 """
432 returns an iterator of the deltas in this changegroup
432 returns an iterator of the deltas in this changegroup
433
433
434 Useful for passing to the underlying storage system to be stored.
434 Useful for passing to the underlying storage system to be stored.
435 """
435 """
436 chain = None
436 chain = None
437 for chunkdata in iter(lambda: self.deltachunk(chain), {}):
437 for chunkdata in iter(lambda: self.deltachunk(chain), {}):
438 # Chunkdata: (node, p1, p2, cs, deltabase, delta, flags)
438 # Chunkdata: (node, p1, p2, cs, deltabase, delta, flags)
439 yield chunkdata
439 yield chunkdata
440 chain = chunkdata[0]
440 chain = chunkdata[0]
441
441
442 class cg2unpacker(cg1unpacker):
442 class cg2unpacker(cg1unpacker):
443 """Unpacker for cg2 streams.
443 """Unpacker for cg2 streams.
444
444
445 cg2 streams add support for generaldelta, so the delta header
445 cg2 streams add support for generaldelta, so the delta header
446 format is slightly different. All other features about the data
446 format is slightly different. All other features about the data
447 remain the same.
447 remain the same.
448 """
448 """
449 deltaheader = _CHANGEGROUPV2_DELTA_HEADER
449 deltaheader = _CHANGEGROUPV2_DELTA_HEADER
450 deltaheadersize = struct.calcsize(deltaheader)
450 deltaheadersize = struct.calcsize(deltaheader)
451 version = '02'
451 version = '02'
452
452
453 def _deltaheader(self, headertuple, prevnode):
453 def _deltaheader(self, headertuple, prevnode):
454 node, p1, p2, deltabase, cs = headertuple
454 node, p1, p2, deltabase, cs = headertuple
455 flags = 0
455 flags = 0
456 return node, p1, p2, deltabase, cs, flags
456 return node, p1, p2, deltabase, cs, flags
457
457
458 class cg3unpacker(cg2unpacker):
458 class cg3unpacker(cg2unpacker):
459 """Unpacker for cg3 streams.
459 """Unpacker for cg3 streams.
460
460
461 cg3 streams add support for exchanging treemanifests and revlog
461 cg3 streams add support for exchanging treemanifests and revlog
462 flags. It adds the revlog flags to the delta header and an empty chunk
462 flags. It adds the revlog flags to the delta header and an empty chunk
463 separating manifests and files.
463 separating manifests and files.
464 """
464 """
465 deltaheader = _CHANGEGROUPV3_DELTA_HEADER
465 deltaheader = _CHANGEGROUPV3_DELTA_HEADER
466 deltaheadersize = struct.calcsize(deltaheader)
466 deltaheadersize = struct.calcsize(deltaheader)
467 version = '03'
467 version = '03'
468 _grouplistcount = 2 # One list of manifests and one list of files
468 _grouplistcount = 2 # One list of manifests and one list of files
469
469
470 def _deltaheader(self, headertuple, prevnode):
470 def _deltaheader(self, headertuple, prevnode):
471 node, p1, p2, deltabase, cs, flags = headertuple
471 node, p1, p2, deltabase, cs, flags = headertuple
472 return node, p1, p2, deltabase, cs, flags
472 return node, p1, p2, deltabase, cs, flags
473
473
474 def _unpackmanifests(self, repo, revmap, trp, prog):
474 def _unpackmanifests(self, repo, revmap, trp, prog):
475 super(cg3unpacker, self)._unpackmanifests(repo, revmap, trp, prog)
475 super(cg3unpacker, self)._unpackmanifests(repo, revmap, trp, prog)
476 for chunkdata in iter(self.filelogheader, {}):
476 for chunkdata in iter(self.filelogheader, {}):
477 # If we get here, there are directory manifests in the changegroup
477 # If we get here, there are directory manifests in the changegroup
478 d = chunkdata["filename"]
478 d = chunkdata["filename"]
479 repo.ui.debug("adding %s revisions\n" % d)
479 repo.ui.debug("adding %s revisions\n" % d)
480 dirlog = repo.manifestlog._revlog.dirlog(d)
480 dirlog = repo.manifestlog._revlog.dirlog(d)
481 deltas = self.deltaiter()
481 deltas = self.deltaiter()
482 if not dirlog.addgroup(deltas, revmap, trp):
482 if not dirlog.addgroup(deltas, revmap, trp):
483 raise error.Abort(_("received dir revlog group is empty"))
483 raise error.Abort(_("received dir revlog group is empty"))
484
484
485 class headerlessfixup(object):
485 class headerlessfixup(object):
486 def __init__(self, fh, h):
486 def __init__(self, fh, h):
487 self._h = h
487 self._h = h
488 self._fh = fh
488 self._fh = fh
489 def read(self, n):
489 def read(self, n):
490 if self._h:
490 if self._h:
491 d, self._h = self._h[:n], self._h[n:]
491 d, self._h = self._h[:n], self._h[n:]
492 if len(d) < n:
492 if len(d) < n:
493 d += readexactly(self._fh, n - len(d))
493 d += readexactly(self._fh, n - len(d))
494 return d
494 return d
495 return readexactly(self._fh, n)
495 return readexactly(self._fh, n)
496
496
497 def ellipsisdata(packer, rev, revlog_, p1, p2, data, linknode):
497 def ellipsisdata(packer, rev, revlog_, p1, p2, data, linknode):
498 n = revlog_.node(rev)
498 n = revlog_.node(rev)
499 p1n, p2n = revlog_.node(p1), revlog_.node(p2)
499 p1n, p2n = revlog_.node(p1), revlog_.node(p2)
500 flags = revlog_.flags(rev)
500 flags = revlog_.flags(rev)
501 flags |= revlog.REVIDX_ELLIPSIS
501 flags |= revlog.REVIDX_ELLIPSIS
502 meta = packer.builddeltaheader(
502 meta = packer.builddeltaheader(
503 n, p1n, p2n, nullid, linknode, flags)
503 n, p1n, p2n, nullid, linknode, flags)
504 # TODO: try and actually send deltas for ellipsis data blocks
504 # TODO: try and actually send deltas for ellipsis data blocks
505 diffheader = mdiff.trivialdiffheader(len(data))
505 diffheader = mdiff.trivialdiffheader(len(data))
506 l = len(meta) + len(diffheader) + len(data)
506 l = len(meta) + len(diffheader) + len(data)
507 return ''.join((chunkheader(l),
507 return ''.join((chunkheader(l),
508 meta,
508 meta,
509 diffheader,
509 diffheader,
510 data))
510 data))
511
511
512 class cg1packer(object):
512 class cg1packer(object):
513 deltaheader = _CHANGEGROUPV1_DELTA_HEADER
513 deltaheader = _CHANGEGROUPV1_DELTA_HEADER
514 version = '01'
514 version = '01'
515 def __init__(self, repo, filematcher, bundlecaps=None):
515 def __init__(self, repo, filematcher, bundlecaps=None):
516 """Given a source repo, construct a bundler.
516 """Given a source repo, construct a bundler.
517
517
518 filematcher is a matcher that matches on files to include in the
518 filematcher is a matcher that matches on files to include in the
519 changegroup. Used to facilitate sparse changegroups.
519 changegroup. Used to facilitate sparse changegroups.
520
520
521 bundlecaps is optional and can be used to specify the set of
521 bundlecaps is optional and can be used to specify the set of
522 capabilities which can be used to build the bundle. While bundlecaps is
522 capabilities which can be used to build the bundle. While bundlecaps is
523 unused in core Mercurial, extensions rely on this feature to communicate
523 unused in core Mercurial, extensions rely on this feature to communicate
524 capabilities to customize the changegroup packer.
524 capabilities to customize the changegroup packer.
525 """
525 """
526 assert filematcher
526 assert filematcher
527 self._filematcher = filematcher
527 self._filematcher = filematcher
528
528
529 # Set of capabilities we can use to build the bundle.
529 # Set of capabilities we can use to build the bundle.
530 if bundlecaps is None:
530 if bundlecaps is None:
531 bundlecaps = set()
531 bundlecaps = set()
532 self._bundlecaps = bundlecaps
532 self._bundlecaps = bundlecaps
533 # experimental config: bundle.reorder
533 # experimental config: bundle.reorder
534 reorder = repo.ui.config('bundle', 'reorder')
534 reorder = repo.ui.config('bundle', 'reorder')
535 if reorder == 'auto':
535 if reorder == 'auto':
536 reorder = None
536 reorder = None
537 else:
537 else:
538 reorder = stringutil.parsebool(reorder)
538 reorder = stringutil.parsebool(reorder)
539 self._repo = repo
539 self._repo = repo
540 self._reorder = reorder
540 self._reorder = reorder
541 if self._repo.ui.verbose and not self._repo.ui.debugflag:
541 if self._repo.ui.verbose and not self._repo.ui.debugflag:
542 self._verbosenote = self._repo.ui.note
542 self._verbosenote = self._repo.ui.note
543 else:
543 else:
544 self._verbosenote = lambda s: None
544 self._verbosenote = lambda s: None
545
545
546 def close(self):
546 def close(self):
547 return closechunk()
547 return closechunk()
548
548
549 def fileheader(self, fname):
549 def fileheader(self, fname):
550 return chunkheader(len(fname)) + fname
550 return chunkheader(len(fname)) + fname
551
551
552 # Extracted both for clarity and for overriding in extensions.
552 # Extracted both for clarity and for overriding in extensions.
553 def _sortgroup(self, revlog, nodelist, lookup):
553 def _sortgroup(self, revlog, nodelist, lookup):
554 """Sort nodes for change group and turn them into revnums."""
554 """Sort nodes for change group and turn them into revnums."""
555 # for generaldelta revlogs, we linearize the revs; this will both be
555 # for generaldelta revlogs, we linearize the revs; this will both be
556 # much quicker and generate a much smaller bundle
556 # much quicker and generate a much smaller bundle
557 if (revlog._generaldelta and self._reorder is None) or self._reorder:
557 if (revlog._generaldelta and self._reorder is None) or self._reorder:
558 dag = dagutil.revlogdag(revlog)
558 dag = dagutil.revlogdag(revlog)
559 return dag.linearize(set(revlog.rev(n) for n in nodelist))
559 return dag.linearize(set(revlog.rev(n) for n in nodelist))
560 else:
560 else:
561 return sorted([revlog.rev(n) for n in nodelist])
561 return sorted([revlog.rev(n) for n in nodelist])
562
562
def group(self, nodelist, revlog, lookup, units=None):
    """Calculate a delta group, yielding a sequence of changegroup chunks
    (strings).

    The nodes in ``nodelist`` are ordered by ``self._sortgroup()`` and each
    one is emitted as a delta against the entry preceding it in that order.
    The very first delta is computed against the first parent of the first
    revision; the receiver is guaranteed to have that parent because it has
    all history before these changesets. When that parent is nullrev the
    group starts with a full revision.

    ``lookup`` is called with each node and must return its linknode.

    If ``units`` is not None, progress is reported and ``units`` names the
    kind of revlog being walked (changelog, manifest, etc.).
    """
    # Nothing is touched by these changesets: emit only the terminator.
    if len(nodelist) == 0:
        yield self.close()
        return

    revs = self._sortgroup(revlog, nodelist, lookup)

    # Seed the list with the first parent of the first rev so that every
    # rev to send has a predecessor to be diffed against.
    firstparent = revlog.parentrevs(revs[0])[0]
    revs.insert(0, firstparent)

    # The seed entry is only ever used as a base, never sent itself.
    count = len(revs) - 1

    progress = None
    if units is not None:
        progress = self._repo.ui.makeprogress(_('bundling'), unit=units,
                                              total=count)

    # Build the deltas, pairing each rev with the one before it.
    for idx in pycompat.xrange(count):
        if progress:
            progress.update(idx + 1)
        prev = revs[idx]
        curr = revs[idx + 1]
        linknode = lookup(revlog.node(curr))
        for chunk in self.revchunk(revlog, curr, prev, linknode):
            yield chunk

    if progress:
        progress.complete()
    yield self.close()
604
604
605 # filter any nodes that claim to be part of the known set
605 # filter any nodes that claim to be part of the known set
def prune(self, revlog, missing, commonrevs):
    """Return the nodes of ``missing`` whose linkrev is not in
    ``commonrevs``.

    For a manifest revlog whose directory is rejected by the file matcher,
    nothing is kept and an empty list is returned.
    """
    # TODO this violates storage abstraction for manifests.
    if (isinstance(revlog, manifest.manifestrevlog) and
        not self._filematcher.visitdir(revlog._dir[:-1] or '.')):
        return []

    torev = revlog.rev
    tolinkrev = revlog.linkrev
    kept = []
    for n in missing:
        if tolinkrev(torev(n)) not in commonrevs:
            kept.append(n)
    return kept
614
614
def _packmanifests(self, dir, mfnodes, lookuplinknode):
    """Pack flat manifests into a changegroup stream.

    Only the root manifest is handled here, hence ``dir`` must be empty.
    """
    assert not dir
    rootlog = self._repo.manifestlog._revlog
    chunks = self.group(mfnodes, rootlog, lookuplinknode,
                        units=_('manifests'))
    for chunk in chunks:
        yield chunk
621
621
622 def _manifestsdone(self):
622 def _manifestsdone(self):
623 return ''
623 return ''
624
624
def generate(self, commonrevs, clnodes, fastpathlinkrev, source):
    '''yield a sequence of changegroup chunks (strings)

    Chunks are produced in this order: the changelog group for
    ``clnodes``, the manifest chunks from generatemanifests(), the file
    chunks from generatefiles(), and a final close chunk. Once the stream
    has been fully produced and ``clnodes`` is not empty, the 'outgoing'
    hook is fired with the first changelog node.

    ``commonrevs`` is forwarded to generatemanifests() and generatefiles().
    ``fastpathlinkrev`` is a request only: it is turned off below when
    reordering is enabled or the repo uses treemanifests.
    '''
    repo = self._repo
    cl = repo.changelog

    # changelog node -> position in which it was emitted
    clrevorder = {}
    mfs = {} # needed manifests
    fnodes = {} # needed file nodes
    changedfiles = set()

    # Callback for the changelog, used to collect changed files and manifest
    # nodes.
    # Returns the linkrev node (identity in the changelog case).
    def lookupcl(x):
        c = cl.read(x)
        clrevorder[x] = len(clrevorder)
        n = c[0]
        # record the first changeset introducing this manifest version
        mfs.setdefault(n, x)
        # Record a complete list of potentially-changed files in
        # this manifest.
        changedfiles.update(c[3])
        return x

    self._verbosenote(_('uncompressed size of bundle content:\n'))
    size = 0
    # Walking the changelog group drives lookupcl(), which is what fills
    # clrevorder, mfs and changedfiles for the later phases.
    for chunk in self.group(clnodes, cl, lookupcl, units=_('changesets')):
        size += len(chunk)
        yield chunk
    self._verbosenote(_('%8.i (changelog)\n') % size)

    # We need to make sure that the linkrev in the changegroup refers to
    # the first changeset that introduced the manifest or file revision.
    # The fastpath is usually safer than the slowpath, because the filelogs
    # are walked in revlog order.
    #
    # When taking the slowpath with reorder=None and the manifest revlog
    # uses generaldelta, the manifest may be walked in the "wrong" order.
    # Without 'clrevorder', we would get an incorrect linkrev (see fix in
    # cc0ff93d0c0c).
    #
    # When taking the fastpath, we are only vulnerable to reordering
    # of the changelog itself. The changelog never uses generaldelta, so
    # it is only reordered when reorder=True. To handle this case, we
    # simply take the slowpath, which already has the 'clrevorder' logic.
    # This was also fixed in cc0ff93d0c0c.
    fastpathlinkrev = fastpathlinkrev and not self._reorder
    # Treemanifests don't work correctly with fastpathlinkrev
    # either, because we don't discover which directory nodes to
    # send along with files. This could probably be fixed.
    fastpathlinkrev = fastpathlinkrev and (
        'treemanifest' not in repo.requirements)

    for chunk in self.generatemanifests(commonrevs, clrevorder,
            fastpathlinkrev, mfs, fnodes, source):
        yield chunk
    # The manifest mapping is no longer needed once manifests are sent.
    mfs.clear()
    clrevs = set(cl.rev(x) for x in clnodes)

    if not fastpathlinkrev:
        # Slow path: use the file node -> linknode mapping collected in
        # fnodes while the manifests were being generated.
        def linknodes(unused, fname):
            return fnodes.get(fname, {})
    else:
        cln = cl.node
        # Fast path: derive the mapping from the filelog's own linkrevs,
        # keeping only revisions linked to a changeset being sent.
        def linknodes(filerevlog, fname):
            llr = filerevlog.linkrev
            fln = filerevlog.node
            revs = ((r, llr(r)) for r in filerevlog)
            return dict((fln(r), cln(lr)) for r, lr in revs if lr in clrevs)

    for chunk in self.generatefiles(changedfiles, linknodes, commonrevs,
                                    source):
        yield chunk

    yield self.close()

    if clnodes:
        repo.hook('outgoing', node=hex(clnodes[0]), source=source)
703
703
def generatemanifests(self, commonrevs, clrevorder, fastpathlinkrev, mfs,
                      fnodes, source):
    """Returns an iterator of changegroup chunks containing manifests.

    ``mfs`` maps root manifest nodes to their linknodes. ``clrevorder``
    maps changelog nodes to the order in which they were emitted and is
    used to keep the earliest linknode for each entry. Unless
    ``fastpathlinkrev`` is set, ``fnodes`` is filled in as a side effect
    while the manifest chunks are consumed.

    `source` is unused here, but is used by extensions like remotefilelog to
    change what is sent based on pulls vs pushes, etc.
    """
    repo = self._repo
    mfl = repo.manifestlog
    dirlog = mfl._revlog.dirlog
    # Work list: directory -> {manifest node: linknode}. It starts with
    # the root manifests and grows as subdirectory manifests are found.
    tmfnodes = {'': mfs}

    # Callback for the manifest, used to collect linkrevs for filelog
    # revisions.
    # Returns the linkrev node (collected in lookupcl).
    def makelookupmflinknode(dir, nodes):
        if fastpathlinkrev:
            # Fast path only ever deals with the root manifest, whose
            # linknodes are already known from mfs.
            assert not dir
            return mfs.__getitem__

        def lookupmflinknode(x):
            """Callback for looking up the linknode for manifests.

            Returns the linkrev node for the specified manifest.

            SIDE EFFECT:

            1) fclnodes gets populated with the list of relevant
               file nodes if we're not using fastpathlinkrev
            2) When treemanifests are in use, collects treemanifest nodes
               to send

            Note that this means manifests must be completely sent to
            the client before you can trust the list of files and
            treemanifests to send.
            """
            clnode = nodes[x]
            mdata = mfl.get(dir, x).readfast(shallow=True)
            for p, n, fl in mdata.iterentries():
                if fl == 't': # subdirectory manifest
                    subdir = dir + p + '/'
                    tmfclnodes = tmfnodes.setdefault(subdir, {})
                    tmfclnode = tmfclnodes.setdefault(n, clnode)
                    # Keep whichever changeset was emitted first.
                    if clrevorder[clnode] < clrevorder[tmfclnode]:
                        tmfclnodes[n] = clnode
                else:
                    f = dir + p
                    fclnodes = fnodes.setdefault(f, {})
                    fclnode = fclnodes.setdefault(n, clnode)
                    # Keep whichever changeset was emitted first.
                    if clrevorder[clnode] < clrevorder[fclnode]:
                        fclnodes[n] = clnode
            return clnode
        return lookupmflinknode

    size = 0
    # tmfnodes may gain entries while the chunks below are consumed, so
    # keep popping until it is exhausted.
    while tmfnodes:
        dir, nodes = tmfnodes.popitem()
        prunednodes = self.prune(dirlog(dir), nodes, commonrevs)
        # The root manifest group is always emitted, even when empty.
        if not dir or prunednodes:
            for x in self._packmanifests(dir, prunednodes,
                                         makelookupmflinknode(dir, nodes)):
                size += len(x)
                yield x
    self._verbosenote(_('%8.i (manifests)\n') % size)
    yield self._manifestsdone()
769
769
770 # The 'source' parameter is useful for extensions
770 # The 'source' parameter is useful for extensions
def generatefiles(self, changedfiles, linknodes, commonrevs, source):
    """Yield the changegroup chunks for every file in ``changedfiles``.

    Files are processed in sorted name order. ``linknodes(filerevlog,
    fname)`` must return a mapping of file node to linknode. Files left
    with no node after pruning against ``commonrevs`` produce no output.

    Raises error.Abort when a changed file has an empty or missing
    filelog. ``source`` is not used here; it exists for extensions.
    """
    repo = self._repo
    progress = repo.ui.makeprogress(_('bundling'), unit=_('files'),
                                    total=len(changedfiles))
    for pos, fname in enumerate(sorted(changedfiles), 1):
        filerevlog = repo.file(fname)
        if not filerevlog:
            raise error.Abort(_("empty or missing file data for %s") %
                              fname)

        # The linknodes were collected up front in the fastpath case and
        # while sending manifests in the slowpath case.
        linkrevnodes = linknodes(filerevlog, fname)

        def linknodeof(x):
            return linkrevnodes[x]

        filenodes = self.prune(filerevlog, linkrevnodes, commonrevs)
        if not filenodes:
            continue

        progress.update(pos, item=fname)
        header = self.fileheader(fname)
        size = len(header)
        yield header
        for chunk in self.group(filenodes, filerevlog, linknodeof):
            size += len(chunk)
            yield chunk
        self._verbosenote(_('%8.i %s\n') % (size, fname))
    progress.complete()
798
798
def deltaparent(self, revlog, rev, p1, p2, prev):
    """Return the revision to use as delta base for ``rev``.

    This packer always deltas against ``prev``. A ProgrammingError is
    raised when the revlog reports that ``prev`` cannot serve as a base.
    """
    if revlog.candelta(prev, rev):
        return prev
    raise error.ProgrammingError('cg1 should not be used in this case')
803
803
def revchunk(self, revlog, rev, prev, linknode):
    """Yield the pieces of one revision's chunk: the chunk header, the
    delta header (plus any diff prefix), and the delta payload.

    The delta base is chosen by ``self.deltaparent()``.
    """
    node = revlog.node(rev)
    p1, p2 = revlog.parentrevs(rev)
    base = self.deltaparent(revlog, rev, p1, p2, prev)

    prefix = ''
    if revlog.iscensored(base) or revlog.iscensored(rev):
        # Send the raw revision (or the tombstone if reading it fails as
        # censored) wrapped in a synthetic diff header rather than
        # computing a real diff.
        try:
            delta = revlog.revision(node, raw=True)
        except error.CensoredNodeError as e:
            delta = e.tombstone
        if base == nullrev:
            prefix = mdiff.trivialdiffheader(len(delta))
        else:
            prefix = mdiff.replacediffheader(revlog.rawsize(base),
                                             len(delta))
    elif base == nullrev:
        # No base: send the full raw text behind a trivial diff header.
        delta = revlog.revision(node, raw=True)
        prefix = mdiff.trivialdiffheader(len(delta))
    else:
        delta = revlog.revdiff(base, rev)

    p1n, p2n = revlog.parents(node)
    basenode = revlog.node(base)
    flags = revlog.flags(rev)
    header = self.builddeltaheader(node, p1n, p2n, basenode, linknode,
                                   flags)
    meta = header + prefix
    yield chunkheader(len(meta) + len(delta))
    yield meta
    yield delta
def builddeltaheader(self, node, p1n, p2n, basenode, linknode, flags):
    """Pack the delta header using the ``self.deltaheader`` format.

    ``basenode`` is not packed: it is implicitly the previous one in HG10.
    ``flags`` is not packed: it is implicitly 0 for cg1 and cg2.
    """
    fields = (node, p1n, p2n, linknode)
    return struct.pack(self.deltaheader, *fields)
838
838
class cg2packer(cg1packer):
    """Changegroup version 02 packer.

    Differs from its base class in that the delta base is carried
    explicitly in each delta header instead of always being the
    previously sent revision.
    """
    version = '02'
    deltaheader = _CHANGEGROUPV2_DELTA_HEADER

    def __init__(self, repo, filematcher, bundlecaps=None):
        super(cg2packer, self).__init__(repo, filematcher,
                                        bundlecaps=bundlecaps)

        # Since generaldelta is directly supported by cg2, reordering
        # generally doesn't help, so we disable it by default (treating
        # bundle.reorder=auto just like bundle.reorder=False).
        if self._reorder is None:
            self._reorder = False

    def deltaparent(self, revlog, rev, p1, p2, prev):
        """Return the revision to delta ``rev`` against.

        May return nullrev, meaning a full revision is to be sent.
        """
        # Narrow ellipses mode.
        if util.safehasattr(self, 'full_nodes'):
            # TODO: send better deltas when in narrow mode.
            #
            # changegroup.group() loops over revisions to send,
            # including revisions we'll skip. What this means is that
            # `prev` will be a potentially useless delta base for all
            # ellipsis nodes, as the client likely won't have it. In
            # the future we should do bookkeeping about which nodes
            # have been sent to the client, and try to be
            # significantly smarter about delta bases. This is
            # slightly tricky because this same code has to work for
            # all revlogs, and we don't have the linkrev/linknode here.
            return p1

        dp = revlog.deltaparent(rev)
        if dp == nullrev:
            if revlog.storedeltachains:
                # Avoid sending full revisions when delta parent is null.
                # Pick prev in that case. It's tempting to pick p1 in this
                # case, as p1 will be smaller in the common case. However,
                # computing a delta against p1 may require resolving the
                # raw text of p1, which could be expensive. The revlog
                # caches should have prev cached, meaning less CPU for
                # changegroup generation. There is likely room to add a
                # flag and/or config option to control this behavior.
                base = prev
            else:
                # revlog is configured to use full snapshot for a reason,
                # stick to full snapshot.
                base = nullrev
        elif dp in (p1, p2, prev):
            base = dp
        else:
            # Pick prev when we can't be sure remote has the base revision.
            # NOTE(review): this returns before the candelta() check
            # below, unlike the other branch that picks prev - confirm
            # that this is intended.
            return prev

        if base != nullrev and not revlog.candelta(base, rev):
            base = nullrev
        return base

    def builddeltaheader(self, node, p1n, p2n, basenode, linknode, flags):
        """Pack the delta header, including the explicit delta base."""
        # Do nothing with flags, it is implicitly 0 in cg1 and cg2
        fields = (node, p1n, p2n, basenode, linknode)
        return struct.pack(self.deltaheader, *fields)
880
895
class cg3packer(cg2packer):
    """Changegroup version 03 packer.

    Adds per-directory manifest groups and packs the revlog flags into
    each delta header.
    """
    version = '03'
    deltaheader = _CHANGEGROUPV3_DELTA_HEADER

    def _packmanifests(self, dir, mfnodes, lookuplinknode):
        """Yield the manifest chunks for ``dir``.

        Groups for a non-root directory are preceded by a file header
        naming that directory.
        """
        if dir:
            yield self.fileheader(dir)

        dirlog = self._repo.manifestlog._revlog.dirlog(dir)
        chunks = self.group(mfnodes, dirlog, lookuplinknode,
                            units=_('manifests'))
        for chunk in chunks:
            yield chunk

    def _manifestsdone(self):
        """Return the chunk that terminates the manifest section."""
        return self.close()

    def builddeltaheader(self, node, p1n, p2n, basenode, linknode, flags):
        """Pack the delta header, including delta base and flags."""
        fields = (node, p1n, p2n, basenode, linknode, flags)
        return struct.pack(self.deltaheader, *fields)
900
915
# Changegroup version -> (packer class, unpacker class).
_packermap = {
    '01': (cg1packer, cg1unpacker),
    # cg2 adds support for exchanging generaldelta
    '02': (cg2packer, cg2unpacker),
    # cg3 adds support for exchanging revlog flags and treemanifests
    '03': (cg3packer, cg3unpacker),
}
907
922
def allsupportedversions(repo):
    """Return the set of changegroup versions known for ``repo``.

    Version '03' is only included when it is enabled through the
    experimental.changegroup3 or experimental.treemanifest config knobs,
    or when the repo has the 'treemanifest' requirement.
    """
    versions = set(_packermap.keys())
    ui = repo.ui
    cg3enabled = (ui.configbool('experimental', 'changegroup3') or
                  ui.configbool('experimental', 'treemanifest') or
                  'treemanifest' in repo.requirements)
    if not cg3enabled:
        versions.discard('03')
    return versions
915
930
916 # Changegroup versions that can be applied to the repo
931 # Changegroup versions that can be applied to the repo
def supportedincomingversions(repo):
    """Return the changegroup versions that can be applied to ``repo``."""
    incoming = allsupportedversions(repo)
    return incoming
919
934
920 # Changegroup versions that can be created from the repo
935 # Changegroup versions that can be created from the repo
def supportedoutgoingversions(repo):
    """Return the changegroup versions that can be created from ``repo``."""
    versions = allsupportedversions(repo)

    # Requirements that rule out versions 01 and 02:
    #
    # - treemanifest: versions 01 and 02 support only flat manifests and
    #   it's just too expensive to convert between the flat manifest and
    #   tree manifest on the fly. Since tree manifests are hashed
    #   differently, all of history would have to be converted. Instead,
    #   we simply don't even pretend to support versions 01 and 02.
    # - narrow: versions 01 and 02 don't support revlog flags, and we
    #   need to support that for stripping and unbundling to work.
    # - lfs: versions 01 and 02 don't support revlog flags, and we need
    #   to mark LFS entries with REVIDX_EXTSTORED.
    cg3only = (
        'treemanifest',
        repository.NARROW_REQUIREMENT,
        LFS_REQUIREMENT,
    )
    for requirement in cg3only:
        if requirement in repo.requirements:
            versions.discard('01')
            versions.discard('02')

    return versions
943
958
def localversion(repo):
    """Return the best version to use for bundles that are meant to be
    used locally, such as those from strip and shelve, and temporary
    bundles.

    This is the highest version that can be created from ``repo``.
    """
    candidates = supportedoutgoingversions(repo)
    return max(candidates)
948
963
def safeversion(repo):
    """Return the smallest version that it's safe to assume clients of the
    repo will support.

    For example, all hg versions that support generaldelta also support
    changegroup 02, so '01' is ruled out for generaldelta repos.
    """
    candidates = supportedoutgoingversions(repo)
    if 'generaldelta' in repo.requirements:
        candidates.discard('01')
    assert candidates
    return min(candidates)
958
973
def getbundler(version, repo, bundlecaps=None, filematcher=None):
    """Return a packer instance for changegroup ``version``.

    ``filematcher`` defaults to a matcher that matches everything and is
    always intersected with the repo's narrow matcher. Version '01' cannot
    be combined with a matcher that does not match everything; doing so
    raises error.ProgrammingError.
    """
    assert version in supportedoutgoingversions(repo)

    if filematcher is None:
        filematcher = matchmod.alwaysmatcher(repo.root, '')

    if version == '01' and not filematcher.always():
        raise error.ProgrammingError('version 01 changegroups do not support '
                                     'sparse file matchers')

    # Requested files could include files not in the local store. So
    # filter those out.
    narrowmatcher = repo.narrowmatch()
    filematcher = matchmod.intersectmatchers(narrowmatcher, filematcher)

    packercls = _packermap[version][0]
    return packercls(repo, filematcher=filematcher, bundlecaps=bundlecaps)
976
991
def getunbundler(version, fh, alg, extras=None):
    """Return an unpacker instance for changegroup ``version``.

    ``fh``, ``alg`` and ``extras`` are handed to the unpacker class as is.
    """
    unpackercls = _packermap[version][1]
    return unpackercls(fh, alg, extras=extras)
979
994
def _changegroupinfo(repo, nodes, source):
    """Report the changesets about to be bundled.

    The count is printed in verbose mode or when ``source`` is 'bundle';
    the hex of every node is printed in debug mode.
    """
    ui = repo.ui
    if ui.verbose or source == 'bundle':
        ui.status(_("%d changesets found\n") % len(nodes))
    if not ui.debugflag:
        return
    ui.debug("list of changesets:\n")
    for node in nodes:
        ui.debug("%s\n" % hex(node))
987
1002
def makechangegroup(repo, outgoing, version, source, fastpath=False,
                    bundlecaps=None):
    """Build a changegroup stream for ``outgoing`` and return it wrapped
    in an unbundler of the same ``version``.

    The number of missing changesets is passed along to the unbundler as
    the 'clcount' extra.
    """
    cgstream = makestream(repo, outgoing, version, source,
                          fastpath=fastpath, bundlecaps=bundlecaps)
    buffered = util.chunkbuffer(cgstream)
    extras = {'clcount': len(outgoing.missing) }
    return getunbundler(version, buffered, None, extras)
994
1009
def makestream(repo, outgoing, version, source, fastpath=False,
               bundlecaps=None, filematcher=None):
    """Return the stream of changegroup chunks for ``outgoing``.

    A bundler for ``version`` is obtained from getbundler(), the
    'preoutgoing' hook is run (with throw=True), the changesets are
    reported through _changegroupinfo() and the result of the bundler's
    generate() is returned.

    ``fastpath`` forces the linkrev fast path. It is also requested
    automatically when the unfiltered repo has no filter name and the
    missing heads are exactly the repo heads.
    """
    bundler = getbundler(version, repo, bundlecaps=bundlecaps,
                         filematcher=filematcher)

    repo = repo.unfiltered()
    commonrevs = outgoing.common
    csets = outgoing.missing
    # Compare a sorted copy: sorting outgoing.missingheads in place would
    # silently reorder a list owned by the caller.
    heads = sorted(outgoing.missingheads)
    # We go through the fast path if we get told to, or if all (unfiltered)
    # heads have been requested (since we then know that all linkrevs will
    # be pulled by the client).
    fastpathlinkrev = fastpath or (
        repo.filtername is None and heads == sorted(repo.heads()))

    repo.hook('preoutgoing', throw=True, source=source)
    _changegroupinfo(repo, csets, source)
    return bundler.generate(commonrevs, csets, fastpathlinkrev, source)
1014
1029
def _addchangegroupfiles(repo, source, revmap, trp, expectedfiles, needfiles):
    """Add the file revlog groups read from ``source`` to ``repo``.

    ``source`` is consumed one filelog header at a time until
    ``source.filelogheader()`` returns an empty dict.  For each header the
    deltas from ``source.deltaiter()`` are added to the matching filelog.

    ``needfiles`` maps a filename to a collection of file nodes that are
    expected.  It is modified in place: nodes are removed as they arrive and
    a file's entry is deleted once nothing remains for it.  Any nodes still
    listed afterwards must already be present in the local filelog.

    Raises ``error.Abort`` when a received group is empty, when a delta base
    is censored, when a file listed in ``needfiles`` receives a node that was
    not expected, or when a needed node is missing from the filelog.

    Returns a ``(revisions, files)`` tuple: the number of filelog revisions
    added and the number of filelog headers processed.
    """
    addedrevs = 0
    filecount = 0
    progress = repo.ui.makeprogress(_('files'), unit=_('files'),
                                    total=expectedfiles)
    for header in iter(source.filelogheader, {}):
        filecount += 1
        fname = header["filename"]
        repo.ui.debug("adding %s revisions\n" % fname)
        progress.increment()
        flog = repo.file(fname)
        oldlen = len(flog)
        try:
            added = flog.addgroup(source.deltaiter(), revmap, trp)
            if not added:
                raise error.Abort(_("received file revlog group is empty"))
        except error.CensoredBaseError as e:
            raise error.Abort(_("received delta base is censored: %s") % e)
        newlen = len(flog)
        addedrevs += newlen - oldlen

        if fname not in needfiles:
            continue

        # Every revision just appended must be one we were waiting for.
        pending = needfiles[fname]
        for rev in pycompat.xrange(oldlen, newlen):
            fnode = flog.node(rev)
            if fnode not in pending:
                raise error.Abort(
                    _("received spurious file revlog entry"))
            pending.remove(fnode)
        if not pending:
            del needfiles[fname]
    progress.complete()

    # Whatever is still listed was not part of the stream; it has to be
    # resolvable from the filelog as it now stands.
    for fname, pending in needfiles.iteritems():
        flog = repo.file(fname)
        for fnode in pending:
            try:
                flog.rev(fnode)
            except error.LookupError:
                raise error.Abort(
                    _('missing file data for %s:%s - run hg verify') %
                    (fname, hex(fnode)))

    return addedrevs, filecount
1058
1073
def _packellipsischangegroup(repo, common, match, relevant_nodes,
                             ellipsisroots, visitnodes, depth, source, version):
    """Generate a changegroup that may contain ellipsis nodes.

    A bundler for ``version`` is created with ``match`` as its file matcher
    and then primed, through plain attributes, with the state used for
    ellipsis handling before ``generate()`` is invoked on it.

    Raises ``error.Abort`` if ``version`` is ``'01'`` or ``'02'``, since
    ellipsis nodes need at least cg3.

    Returns the result of the bundler's ``generate()`` call.
    """
    if version in ('01', '02'):
        raise error.Abort(
            'ellipsis nodes require at least cg3 on client and server, '
            'but negotiated version %s' % version)

    # The attributes set below act as a side channel into the bundler: a
    # revision whose linknode is not in ``full_nodes`` is an ellipsis node,
    # and sending its data is deferred until pending ellipsis nodes are
    # flushed.
    bundler = getbundler(version, repo, filematcher=match)

    # Nodes that must NOT be turned into ellipsis nodes.  This set is kept
    # instead of its complement because for very large histories it is
    # expected to be significantly smaller.
    bundler.full_nodes = relevant_nodes
    # Ellipsis revs -> their roots at the changelog level.
    bundler.precomputed_ellipsis = ellipsisroots
    # Changelog revs -> per-revlog revisions.  Cleared in close() at the end
    # of each group.
    bundler.clrev_to_localrev = {}
    bundler.next_clrev_to_localrev = {}
    # Changelog nodes -> changelog revs.  Filled in once during the changelog
    # stage and left unmodified afterwards.
    bundler.clnode_to_rev = {}
    bundler.changelog_done = False
    # When true, tells the bundler it is serving shallow content and might
    # need to pack file contents not introduced by the changes being packed.
    bundler.is_shallow = depth is not None

    return bundler.generate(common, visitnodes, False, source)
General Comments 0
You need to be logged in to leave comments. Login now