##// END OF EJS Templates
narrowbundle2: more kwargs native string fixes...
Augie Fackler -
r36377:adce75cd default
parent child Browse files
Show More
@@ -1,494 +1,494 b''
1 1 # narrowbundle2.py - bundle2 extensions for narrow repository support
2 2 #
3 3 # Copyright 2017 Google, Inc.
4 4 #
5 5 # This software may be used and distributed according to the terms of the
6 6 # GNU General Public License version 2 or any later version.
7 7
8 8 from __future__ import absolute_import
9 9
10 10 import collections
11 11 import errno
12 12 import struct
13 13
14 14 from mercurial.i18n import _
15 15 from mercurial.node import (
16 16 bin,
17 17 nullid,
18 18 nullrev,
19 19 )
20 20 from mercurial import (
21 21 bundle2,
22 22 changegroup,
23 23 dagutil,
24 24 error,
25 25 exchange,
26 26 extensions,
27 27 narrowspec,
28 28 repair,
29 29 util,
30 30 wireproto,
31 31 )
32 32
33 33 from . import (
34 34 narrowrepo,
35 35 )
36 36
37 37 NARROWCAP = 'narrow'
38 38 _NARROWACL_SECTION = 'narrowhgacl'
39 39 _CHANGESPECPART = NARROWCAP + ':changespec'
40 40 _SPECPART = NARROWCAP + ':spec'
41 41 _SPECPART_INCLUDE = 'include'
42 42 _SPECPART_EXCLUDE = 'exclude'
43 43 _KILLNODESIGNAL = 'KILL'
44 44 _DONESIGNAL = 'DONE'
45 45 _ELIDEDCSHEADER = '>20s20s20sl' # cset id, p1, p2, len(text)
46 46 _ELIDEDMFHEADER = '>20s20s20s20sl' # manifest id, p1, p2, link id, len(text)
47 47 _CSHEADERSIZE = struct.calcsize(_ELIDEDCSHEADER)
48 48 _MFHEADERSIZE = struct.calcsize(_ELIDEDMFHEADER)
49 49
50 50 # When advertising capabilities, always include narrow clone support.
51 51 def getrepocaps_narrow(orig, repo, **kwargs):
52 52 caps = orig(repo, **kwargs)
53 53 caps[NARROWCAP] = ['v0']
54 54 return caps
55 55
56 56 def _computeellipsis(repo, common, heads, known, match, depth=None):
57 57 """Compute the shape of a narrowed DAG.
58 58
59 59 Args:
60 60 repo: The repository we're transferring.
61 61 common: The roots of the DAG range we're transferring.
62 62 May be just [nullid], which means all ancestors of heads.
63 63 heads: The heads of the DAG range we're transferring.
64 64 match: The narrowmatcher that allows us to identify relevant changes.
65 65 depth: If not None, only consider nodes to be full nodes if they are at
66 66 most depth changesets away from one of heads.
67 67
68 68 Returns:
69 69 A tuple of (visitnodes, relevant_nodes, ellipsisroots) where:
70 70
71 71 visitnodes: The list of nodes (either full or ellipsis) which
72 72 need to be sent to the client.
73 73 relevant_nodes: The set of changelog nodes which change a file inside
74 74 the narrowspec. The client needs these as non-ellipsis nodes.
75 75 ellipsisroots: A dict of {rev: parents} that is used in
76 76 narrowchangegroup to produce ellipsis nodes with the
77 77 correct parents.
78 78 """
79 79 cl = repo.changelog
80 80 mfl = repo.manifestlog
81 81
82 82 cldag = dagutil.revlogdag(cl)
83 83 # dagutil does not like nullid/nullrev
84 84 commonrevs = cldag.internalizeall(common - set([nullid])) | set([nullrev])
85 85 headsrevs = cldag.internalizeall(heads)
86 86 if depth:
87 87 revdepth = {h: 0 for h in headsrevs}
88 88
89 89 ellipsisheads = collections.defaultdict(set)
90 90 ellipsisroots = collections.defaultdict(set)
91 91
92 92 def addroot(head, curchange):
93 93 """Add a root to an ellipsis head, splitting heads with 3 roots."""
94 94 ellipsisroots[head].add(curchange)
95 95 # Recursively split ellipsis heads with 3 roots by finding the
96 96 # roots' youngest common descendant which is an elided merge commit.
97 97 # That descendant takes 2 of the 3 roots as its own, and becomes a
98 98 # root of the head.
99 99 while len(ellipsisroots[head]) > 2:
100 100 child, roots = splithead(head)
101 101 splitroots(head, child, roots)
102 102 head = child # Recurse in case we just added a 3rd root
103 103
104 104 def splitroots(head, child, roots):
105 105 ellipsisroots[head].difference_update(roots)
106 106 ellipsisroots[head].add(child)
107 107 ellipsisroots[child].update(roots)
108 108 ellipsisroots[child].discard(child)
109 109
110 110 def splithead(head):
111 111 r1, r2, r3 = sorted(ellipsisroots[head])
112 112 for nr1, nr2 in ((r2, r3), (r1, r3), (r1, r2)):
113 113 mid = repo.revs('sort(merge() & %d::%d & %d::%d, -rev)',
114 114 nr1, head, nr2, head)
115 115 for j in mid:
116 116 if j == nr2:
117 117 return nr2, (nr1, nr2)
118 118 if j not in ellipsisroots or len(ellipsisroots[j]) < 2:
119 119 return j, (nr1, nr2)
120 120 raise error.Abort('Failed to split up ellipsis node! head: %d, '
121 121 'roots: %d %d %d' % (head, r1, r2, r3))
122 122
123 123 missing = list(cl.findmissingrevs(common=commonrevs, heads=headsrevs))
124 124 visit = reversed(missing)
125 125 relevant_nodes = set()
126 126 visitnodes = [cl.node(m) for m in missing]
127 127 required = set(headsrevs) | known
128 128 for rev in visit:
129 129 clrev = cl.changelogrevision(rev)
130 130 ps = cldag.parents(rev)
131 131 if depth is not None:
132 132 curdepth = revdepth[rev]
133 133 for p in ps:
134 134 revdepth[p] = min(curdepth + 1, revdepth.get(p, depth + 1))
135 135 needed = False
136 136 shallow_enough = depth is None or revdepth[rev] <= depth
137 137 if shallow_enough:
138 138 curmf = mfl[clrev.manifest].read()
139 139 if ps:
140 140 # We choose to not trust the changed files list in
141 141 # changesets because it's not always correct. TODO: could
142 142 # we trust it for the non-merge case?
143 143 p1mf = mfl[cl.changelogrevision(ps[0]).manifest].read()
144 144 needed = bool(curmf.diff(p1mf, match))
145 145 if not needed and len(ps) > 1:
146 146 # For merge changes, the list of changed files is not
147 147 # helpful, since we need to emit the merge if a file
148 148 # in the narrow spec has changed on either side of the
149 149 # merge. As a result, we do a manifest diff to check.
150 150 p2mf = mfl[cl.changelogrevision(ps[1]).manifest].read()
151 151 needed = bool(curmf.diff(p2mf, match))
152 152 else:
153 153 # For a root node, we need to include the node if any
154 154 # files in the node match the narrowspec.
155 155 needed = any(curmf.walk(match))
156 156
157 157 if needed:
158 158 for head in ellipsisheads[rev]:
159 159 addroot(head, rev)
160 160 for p in ps:
161 161 required.add(p)
162 162 relevant_nodes.add(cl.node(rev))
163 163 else:
164 164 if not ps:
165 165 ps = [nullrev]
166 166 if rev in required:
167 167 for head in ellipsisheads[rev]:
168 168 addroot(head, rev)
169 169 for p in ps:
170 170 ellipsisheads[p].add(rev)
171 171 else:
172 172 for p in ps:
173 173 ellipsisheads[p] |= ellipsisheads[rev]
174 174
175 175 # add common changesets as roots of their reachable ellipsis heads
176 176 for c in commonrevs:
177 177 for head in ellipsisheads[c]:
178 178 addroot(head, c)
179 179 return visitnodes, relevant_nodes, ellipsisroots
180 180
181 181 def _packellipsischangegroup(repo, common, match, relevant_nodes,
182 182 ellipsisroots, visitnodes, depth, source, version):
183 183 if version in ('01', '02'):
184 184 raise error.Abort(
185 185 'ellipsis nodes require at least cg3 on client and server, '
186 186 'but negotiated version %s' % version)
187 187 # We wrap cg1packer.revchunk, using a side channel to pass
188 188 # relevant_nodes into that area. Then if linknode isn't in the
189 189 # set, we know we have an ellipsis node and we should defer
190 190 # sending that node's data. We override close() to detect
191 191 # pending ellipsis nodes and flush them.
192 192 packer = changegroup.getbundler(version, repo)
193 193 # Let the packer have access to the narrow matcher so it can
194 194 # omit filelogs and dirlogs as needed
195 195 packer._narrow_matcher = lambda : match
196 196 # Give the packer the list of nodes which should not be
197 197 # ellipsis nodes. We store this rather than the set of nodes
198 198 # that should be an ellipsis because for very large histories
199 199 # we expect this to be significantly smaller.
200 200 packer.full_nodes = relevant_nodes
201 201 # Maps ellipsis revs to their roots at the changelog level.
202 202 packer.precomputed_ellipsis = ellipsisroots
203 203 # Maps CL revs to per-revlog revisions. Cleared in close() at
204 204 # the end of each group.
205 205 packer.clrev_to_localrev = {}
206 206 packer.next_clrev_to_localrev = {}
207 207 # Maps changelog nodes to changelog revs. Filled in once
208 208 # during changelog stage and then left unmodified.
209 209 packer.clnode_to_rev = {}
210 210 packer.changelog_done = False
211 211 # If true, informs the packer that it is serving shallow content and might
212 212 # need to pack file contents not introduced by the changes being packed.
213 213 packer.is_shallow = depth is not None
214 214
215 215 return packer.generate(common, visitnodes, False, source)
216 216
217 217 # Serve a changegroup for a client with a narrow clone.
218 218 def getbundlechangegrouppart_narrow(bundler, repo, source,
219 219 bundlecaps=None, b2caps=None, heads=None,
220 220 common=None, **kwargs):
221 221 cgversions = b2caps.get('changegroup')
222 222 if cgversions: # 3.1 and 3.2 ship with an empty value
223 223 cgversions = [v for v in cgversions
224 224 if v in changegroup.supportedoutgoingversions(repo)]
225 225 if not cgversions:
226 226 raise ValueError(_('no common changegroup version'))
227 227 version = max(cgversions)
228 228 else:
229 229 raise ValueError(_("server does not advertise changegroup version,"
230 230 " can't negotiate support for ellipsis nodes"))
231 231
232 232 include = sorted(filter(bool, kwargs.get(r'includepats', [])))
233 233 exclude = sorted(filter(bool, kwargs.get(r'excludepats', [])))
234 234 newmatch = narrowspec.match(repo.root, include=include, exclude=exclude)
235 235 if not repo.ui.configbool("experimental", "narrowservebrokenellipses"):
236 236 outgoing = exchange._computeoutgoing(repo, heads, common)
237 237 if not outgoing.missing:
238 238 return
239 239 def wrappedgetbundler(orig, *args, **kwargs):
240 240 bundler = orig(*args, **kwargs)
241 241 bundler._narrow_matcher = lambda : newmatch
242 242 return bundler
243 243 with extensions.wrappedfunction(changegroup, 'getbundler',
244 244 wrappedgetbundler):
245 245 cg = changegroup.makestream(repo, outgoing, version, source)
246 246 part = bundler.newpart('changegroup', data=cg)
247 247 part.addparam('version', version)
248 248 if 'treemanifest' in repo.requirements:
249 249 part.addparam('treemanifest', '1')
250 250
251 251 if include or exclude:
252 252 narrowspecpart = bundler.newpart(_SPECPART)
253 253 if include:
254 254 narrowspecpart.addparam(
255 255 _SPECPART_INCLUDE, '\n'.join(include), mandatory=True)
256 256 if exclude:
257 257 narrowspecpart.addparam(
258 258 _SPECPART_EXCLUDE, '\n'.join(exclude), mandatory=True)
259 259
260 260 return
261 261
262 depth = kwargs.get('depth', None)
262 depth = kwargs.get(r'depth', None)
263 263 if depth is not None:
264 264 depth = int(depth)
265 265 if depth < 1:
266 266 raise error.Abort(_('depth must be positive, got %d') % depth)
267 267
268 268 heads = set(heads or repo.heads())
269 269 common = set(common or [nullid])
270 oldinclude = sorted(filter(bool, kwargs.get('oldincludepats', [])))
271 oldexclude = sorted(filter(bool, kwargs.get('oldexcludepats', [])))
272 known = {bin(n) for n in kwargs.get('known', [])}
270 oldinclude = sorted(filter(bool, kwargs.get(r'oldincludepats', [])))
271 oldexclude = sorted(filter(bool, kwargs.get(r'oldexcludepats', [])))
272 known = {bin(n) for n in kwargs.get(r'known', [])}
273 273 if known and (oldinclude != include or oldexclude != exclude):
274 274 # Steps:
275 275 # 1. Send kill for "$known & ::common"
276 276 #
277 277 # 2. Send changegroup for ::common
278 278 #
279 279 # 3. Proceed.
280 280 #
281 281 # In the future, we can send kills for only the specific
282 282 # nodes we know should go away or change shape, and then
283 283 # send a data stream that tells the client something like this:
284 284 #
285 285 # a) apply this changegroup
286 286 # b) apply nodes XXX, YYY, ZZZ that you already have
287 287 # c) goto a
288 288 #
289 289 # until they've built up the full new state.
290 290 # Convert to revnums and intersect with "common". The client should
291 291 # have made it a subset of "common" already, but let's be safe.
292 292 known = set(repo.revs("%ln & ::%ln", known, common))
293 293 # TODO: we could send only roots() of this set, and the
294 294 # list of nodes in common, and the client could work out
295 295 # what to strip, instead of us explicitly sending every
296 296 # single node.
297 297 deadrevs = known
298 298 def genkills():
299 299 for r in deadrevs:
300 300 yield _KILLNODESIGNAL
301 301 yield repo.changelog.node(r)
302 302 yield _DONESIGNAL
303 303 bundler.newpart(_CHANGESPECPART, data=genkills())
304 304 newvisit, newfull, newellipsis = _computeellipsis(
305 305 repo, set(), common, known, newmatch)
306 306 if newvisit:
307 307 cg = _packellipsischangegroup(
308 308 repo, common, newmatch, newfull, newellipsis,
309 309 newvisit, depth, source, version)
310 310 part = bundler.newpart('changegroup', data=cg)
311 311 part.addparam('version', version)
312 312 if 'treemanifest' in repo.requirements:
313 313 part.addparam('treemanifest', '1')
314 314
315 315 visitnodes, relevant_nodes, ellipsisroots = _computeellipsis(
316 316 repo, common, heads, set(), newmatch, depth=depth)
317 317
318 318 repo.ui.debug('Found %d relevant revs\n' % len(relevant_nodes))
319 319 if visitnodes:
320 320 cg = _packellipsischangegroup(
321 321 repo, common, newmatch, relevant_nodes, ellipsisroots,
322 322 visitnodes, depth, source, version)
323 323 part = bundler.newpart('changegroup', data=cg)
324 324 part.addparam('version', version)
325 325 if 'treemanifest' in repo.requirements:
326 326 part.addparam('treemanifest', '1')
327 327
328 328 def applyacl_narrow(repo, kwargs):
329 329 ui = repo.ui
330 330 username = ui.shortuser(ui.environ.get('REMOTE_USER') or ui.username())
331 331 user_includes = ui.configlist(
332 332 _NARROWACL_SECTION, username + '.includes',
333 333 ui.configlist(_NARROWACL_SECTION, 'default.includes'))
334 334 user_excludes = ui.configlist(
335 335 _NARROWACL_SECTION, username + '.excludes',
336 336 ui.configlist(_NARROWACL_SECTION, 'default.excludes'))
337 337 if not user_includes:
338 338 raise error.Abort(_("{} configuration for user {} is empty")
339 339 .format(_NARROWACL_SECTION, username))
340 340
341 341 user_includes = [
342 342 'path:.' if p == '*' else 'path:' + p for p in user_includes]
343 343 user_excludes = [
344 344 'path:.' if p == '*' else 'path:' + p for p in user_excludes]
345 345
346 req_includes = set(kwargs.get('includepats', []))
347 req_excludes = set(kwargs.get('excludepats', []))
346 req_includes = set(kwargs.get(r'includepats', []))
347 req_excludes = set(kwargs.get(r'excludepats', []))
348 348
349 349 req_includes, req_excludes, invalid_includes = narrowspec.restrictpatterns(
350 350 req_includes, req_excludes, user_includes, user_excludes)
351 351
352 352 if invalid_includes:
353 353 raise error.Abort(
354 354 _("The following includes are not accessible for {}: {}")
355 355 .format(username, invalid_includes))
356 356
357 357 new_args = {}
358 358 new_args.update(kwargs)
359 359 new_args['includepats'] = req_includes
360 360 if req_excludes:
361 361 new_args['excludepats'] = req_excludes
362 362 return new_args
363 363
364 364 @bundle2.parthandler(_SPECPART, (_SPECPART_INCLUDE, _SPECPART_EXCLUDE))
365 365 def _handlechangespec_2(op, inpart):
366 366 includepats = set(inpart.params.get(_SPECPART_INCLUDE, '').splitlines())
367 367 excludepats = set(inpart.params.get(_SPECPART_EXCLUDE, '').splitlines())
368 368 narrowspec.save(op.repo, includepats, excludepats)
369 369 if not narrowrepo.REQUIREMENT in op.repo.requirements:
370 370 op.repo.requirements.add(narrowrepo.REQUIREMENT)
371 371 op.repo._writerequirements()
372 372 op.repo.invalidate(clearfilecache=True)
373 373
374 374 @bundle2.parthandler(_CHANGESPECPART)
375 375 def _handlechangespec(op, inpart):
376 376 repo = op.repo
377 377 cl = repo.changelog
378 378
379 379 # changesets which need to be stripped entirely. either they're no longer
380 380 # needed in the new narrow spec, or the server is sending a replacement
381 381 # in the changegroup part.
382 382 clkills = set()
383 383
384 384 # A changespec part contains all the updates to ellipsis nodes
385 385 # that will happen as a result of widening or narrowing a
386 386 # repo. All the changes that this block encounters are ellipsis
387 387 # nodes or flags to kill an existing ellipsis.
388 388 chunksignal = changegroup.readexactly(inpart, 4)
389 389 while chunksignal != _DONESIGNAL:
390 390 if chunksignal == _KILLNODESIGNAL:
391 391 # a node used to be an ellipsis but isn't anymore
392 392 ck = changegroup.readexactly(inpart, 20)
393 393 if cl.hasnode(ck):
394 394 clkills.add(ck)
395 395 else:
396 396 raise error.Abort(
397 397 _('unexpected changespec node chunk type: %s') % chunksignal)
398 398 chunksignal = changegroup.readexactly(inpart, 4)
399 399
400 400 if clkills:
401 401 # preserve bookmarks that repair.strip() would otherwise strip
402 402 bmstore = repo._bookmarks
403 403 class dummybmstore(dict):
404 404 def applychanges(self, repo, tr, changes):
405 405 pass
406 406 def recordchange(self, tr): # legacy version
407 407 pass
408 408 repo._bookmarks = dummybmstore()
409 409 chgrpfile = repair.strip(op.ui, repo, list(clkills), backup=True,
410 410 topic='widen')
411 411 repo._bookmarks = bmstore
412 412 if chgrpfile:
413 413 # presence of _widen_bundle attribute activates widen handler later
414 414 op._widen_bundle = chgrpfile
415 415 # Set the new narrowspec if we're widening. The setnewnarrowpats() method
416 416 # will currently always be there when using the core+narrowhg server, but
417 417 # other servers may include a changespec part even when not widening (e.g.
418 418 # because we're deepening a shallow repo).
419 419 if util.safehasattr(repo, 'setnewnarrowpats'):
420 420 repo.setnewnarrowpats()
421 421
422 422 def handlechangegroup_widen(op, inpart):
423 423 """Changegroup exchange handler which restores temporarily-stripped nodes"""
424 424 # We saved a bundle with stripped node data we must now restore.
425 425 # This approach is based on mercurial/repair.py@6ee26a53c111.
426 426 repo = op.repo
427 427 ui = op.ui
428 428
429 429 chgrpfile = op._widen_bundle
430 430 del op._widen_bundle
431 431 vfs = repo.vfs
432 432
433 433 ui.note(_("adding branch\n"))
434 434 f = vfs.open(chgrpfile, "rb")
435 435 try:
436 436 gen = exchange.readbundle(ui, f, chgrpfile, vfs)
437 437 if not ui.verbose:
438 438 # silence internal shuffling chatter
439 439 ui.pushbuffer()
440 440 if isinstance(gen, bundle2.unbundle20):
441 441 with repo.transaction('strip') as tr:
442 442 bundle2.processbundle(repo, gen, lambda: tr)
443 443 else:
444 444 gen.apply(repo, 'strip', 'bundle:' + vfs.join(chgrpfile), True)
445 445 if not ui.verbose:
446 446 ui.popbuffer()
447 447 finally:
448 448 f.close()
449 449
450 450 # remove undo files
451 451 for undovfs, undofile in repo.undofiles():
452 452 try:
453 453 undovfs.unlink(undofile)
454 454 except OSError as e:
455 455 if e.errno != errno.ENOENT:
456 456 ui.warn(_('error removing %s: %s\n') %
457 457 (undovfs.join(undofile), str(e)))
458 458
459 459 # Remove partial backup only if there were no exceptions
460 460 vfs.unlink(chgrpfile)
461 461
462 462 def setup():
463 463 """Enable narrow repo support in bundle2-related extension points."""
464 464 extensions.wrapfunction(bundle2, 'getrepocaps', getrepocaps_narrow)
465 465
466 466 wireproto.gboptsmap['narrow'] = 'boolean'
467 467 wireproto.gboptsmap['depth'] = 'plain'
468 468 wireproto.gboptsmap['oldincludepats'] = 'csv'
469 469 wireproto.gboptsmap['oldexcludepats'] = 'csv'
470 470 wireproto.gboptsmap['includepats'] = 'csv'
471 471 wireproto.gboptsmap['excludepats'] = 'csv'
472 472 wireproto.gboptsmap['known'] = 'csv'
473 473
474 474 # Extend changegroup serving to handle requests from narrow clients.
475 475 origcgfn = exchange.getbundle2partsmapping['changegroup']
476 476 def wrappedcgfn(*args, **kwargs):
477 477 repo = args[1]
478 478 if repo.ui.has_section(_NARROWACL_SECTION):
479 479 getbundlechangegrouppart_narrow(
480 480 *args, **applyacl_narrow(repo, kwargs))
481 481 elif kwargs.get(r'narrow', False):
482 482 getbundlechangegrouppart_narrow(*args, **kwargs)
483 483 else:
484 484 origcgfn(*args, **kwargs)
485 485 exchange.getbundle2partsmapping['changegroup'] = wrappedcgfn
486 486
487 487 # Extend changegroup receiver so client can fixup after widen requests.
488 488 origcghandler = bundle2.parthandlermapping['changegroup']
489 489 def wrappedcghandler(op, inpart):
490 490 origcghandler(op, inpart)
491 491 if util.safehasattr(op, '_widen_bundle'):
492 492 handlechangegroup_widen(op, inpart)
493 493 wrappedcghandler.params = origcghandler.params
494 494 bundle2.parthandlermapping['changegroup'] = wrappedcghandler
General Comments 0
You need to be logged in to leave comments. Login now