changegroup: pass ellipsis roots into cgpacker constructor...
Gregory Szorc
r38943:ad4c4cc9 default
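This revision lets callers hand cgpacker the precomputed mapping of ellipsis revisions to their changelog-level roots at construction time (stored as self._precomputedellipsis), rather than reading a self._precomputed_ellipsis attribute attached to the packer from outside; the lookupcl() hunk below renames its lookup to match. A minimal sketch of what a narrow-aware caller might look like after this change; the helper names and argument values here are illustrative assumptions, not the actual call sites of this series:

    # Hypothetical sketch only; every value below is a placeholder.
    ellipsisroots = {}  # changelog rev -> roots of its ellipsis

    packer = cgpacker(repo,
                      matchmod.always(repo.root, ''),
                      '03',
                      allowreorder=True,
                      useprevdelta=False,
                      builddeltaheader=builddeltaheader,  # assumed callable
                      manifestsend=closechunk(),
                      sendtreemanifests=True,
                      bundlecaps=None,
                      shallow=False,
                      ellipsisroots=ellipsisroots)

With ellipsisroots=None the packer behaves as before; the mapping is consulted only in ellipses serving mode (when a _full_nodes attribute is present), as the lookupcl() change below shows.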
diff --git a/mercurial/changegroup.py b/mercurial/changegroup.py
@@ -1,1413 +1,1423 @@
 # changegroup.py - Mercurial changegroup manipulation functions
 #
 # Copyright 2006 Matt Mackall <mpm@selenic.com>
 #
 # This software may be used and distributed according to the terms of the
 # GNU General Public License version 2 or any later version.

 from __future__ import absolute_import

 import os
 import struct
 import weakref

 from .i18n import _
 from .node import (
     hex,
     nullid,
     nullrev,
     short,
 )

 from .thirdparty import (
     attr,
 )

 from . import (
     dagutil,
     error,
     manifest,
     match as matchmod,
     mdiff,
     phases,
     pycompat,
     repository,
     revlog,
     util,
 )

 from .utils import (
     stringutil,
 )

 _CHANGEGROUPV1_DELTA_HEADER = struct.Struct("20s20s20s20s")
 _CHANGEGROUPV2_DELTA_HEADER = struct.Struct("20s20s20s20s20s")
 _CHANGEGROUPV3_DELTA_HEADER = struct.Struct(">20s20s20s20s20sH")

 LFS_REQUIREMENT = 'lfs'

 readexactly = util.readexactly

 def getchunk(stream):
     """return the next chunk from stream as a string"""
     d = readexactly(stream, 4)
     l = struct.unpack(">l", d)[0]
     if l <= 4:
         if l:
             raise error.Abort(_("invalid chunk length %d") % l)
         return ""
     return readexactly(stream, l - 4)

 def chunkheader(length):
     """return a changegroup chunk header (string)"""
     return struct.pack(">l", length + 4)

 def closechunk():
     """return a changegroup chunk header (string) for a zero-length chunk"""
     return struct.pack(">l", 0)

 def writechunks(ui, chunks, filename, vfs=None):
     """Write chunks to a file and return its filename.

     The stream is assumed to be a bundle file.
     Existing files will not be overwritten.
     If no filename is specified, a temporary file is created.
     """
     fh = None
     cleanup = None
     try:
         if filename:
             if vfs:
                 fh = vfs.open(filename, "wb")
             else:
                 # Increase default buffer size because default is usually
                 # small (4k is common on Linux).
                 fh = open(filename, "wb", 131072)
         else:
             fd, filename = pycompat.mkstemp(prefix="hg-bundle-", suffix=".hg")
             fh = os.fdopen(fd, r"wb")
         cleanup = filename
         for c in chunks:
             fh.write(c)
         cleanup = None
         return filename
     finally:
         if fh is not None:
             fh.close()
         if cleanup is not None:
             if filename and vfs:
                 vfs.unlink(cleanup)
             else:
                 os.unlink(cleanup)

 class cg1unpacker(object):
     """Unpacker for cg1 changegroup streams.

     A changegroup unpacker handles the framing of the revision data in
     the wire format. Most consumers will want to use the apply()
     method to add the changes from the changegroup to a repository.

     If you're forwarding a changegroup unmodified to another consumer,
     use getchunks(), which returns an iterator of changegroup
     chunks. This is mostly useful for cases where you need to know the
     data stream has ended by observing the end of the changegroup.

     deltachunk() is useful only if you're applying delta data. Most
     consumers should prefer apply() instead.

     A few other public methods exist. Those are used only for
     bundlerepo and some debug commands - their use is discouraged.
     """
     deltaheader = _CHANGEGROUPV1_DELTA_HEADER
     deltaheadersize = deltaheader.size
     version = '01'
     _grouplistcount = 1 # One list of files after the manifests

     def __init__(self, fh, alg, extras=None):
         if alg is None:
             alg = 'UN'
         if alg not in util.compengines.supportedbundletypes:
             raise error.Abort(_('unknown stream compression type: %s')
                               % alg)
         if alg == 'BZ':
             alg = '_truncatedBZ'

         compengine = util.compengines.forbundletype(alg)
         self._stream = compengine.decompressorreader(fh)
         self._type = alg
         self.extras = extras or {}
         self.callback = None

     # These methods (compressed, read, seek, tell) all appear to only
     # be used by bundlerepo, but it's a little hard to tell.
     def compressed(self):
         return self._type is not None and self._type != 'UN'
     def read(self, l):
         return self._stream.read(l)
     def seek(self, pos):
         return self._stream.seek(pos)
     def tell(self):
         return self._stream.tell()
     def close(self):
         return self._stream.close()

     def _chunklength(self):
         d = readexactly(self._stream, 4)
         l = struct.unpack(">l", d)[0]
         if l <= 4:
             if l:
                 raise error.Abort(_("invalid chunk length %d") % l)
             return 0
         if self.callback:
             self.callback()
         return l - 4

     def changelogheader(self):
         """v10 does not have a changelog header chunk"""
         return {}

     def manifestheader(self):
         """v10 does not have a manifest header chunk"""
         return {}

     def filelogheader(self):
         """return the header of the filelogs chunk, v10 only has the filename"""
         l = self._chunklength()
         if not l:
             return {}
         fname = readexactly(self._stream, l)
         return {'filename': fname}

     def _deltaheader(self, headertuple, prevnode):
         node, p1, p2, cs = headertuple
         if prevnode is None:
             deltabase = p1
         else:
             deltabase = prevnode
         flags = 0
         return node, p1, p2, deltabase, cs, flags

     def deltachunk(self, prevnode):
         l = self._chunklength()
         if not l:
             return {}
         headerdata = readexactly(self._stream, self.deltaheadersize)
         header = self.deltaheader.unpack(headerdata)
         delta = readexactly(self._stream, l - self.deltaheadersize)
         node, p1, p2, deltabase, cs, flags = self._deltaheader(header, prevnode)
         return (node, p1, p2, cs, deltabase, delta, flags)

     def getchunks(self):
         """returns all the chunks contained in the bundle

         Used when you need to forward the binary stream to a file or another
         network API. To do so, it parses the changegroup data; otherwise it
         would block on an sshrepo, which doesn't know where the stream ends.
         """
         # For changegroup 1 and 2, we expect 3 parts: changelog, manifestlog,
         # and a list of filelogs. For changegroup 3, we expect 4 parts:
         # changelog, manifestlog, a list of tree manifestlogs, and a list of
         # filelogs.
         #
         # Changelog and manifestlog parts are terminated with empty chunks. The
         # tree and file parts are a list of entry sections. Each entry section
         # is a series of chunks terminating in an empty chunk. The list of these
         # entry sections is terminated in yet another empty chunk, so we know
         # we've reached the end of the tree/file list when we reach an empty
         # chunk that was preceded by no non-empty chunks.

         parts = 0
         while parts < 2 + self._grouplistcount:
             noentries = True
             while True:
                 chunk = getchunk(self)
                 if not chunk:
                     # The first two empty chunks represent the end of the
                     # changelog and the manifestlog portions. The remaining
                     # empty chunks represent either A) the end of individual
                     # tree or file entries in the file list, or B) the end of
                     # the entire list. It's the end of the entire list if there
                     # were no entries (i.e. noentries is True).
                     if parts < 2:
                         parts += 1
                     elif noentries:
                         parts += 1
                     break
                 noentries = False
                 yield chunkheader(len(chunk))
                 pos = 0
                 while pos < len(chunk):
                     next = pos + 2**20
                     yield chunk[pos:next]
                     pos = next
             yield closechunk()

     def _unpackmanifests(self, repo, revmap, trp, prog):
         self.callback = prog.increment
         # no need to check for empty manifest group here:
         # if the result of the merge of 1 and 2 is the same in 3 and 4,
         # no new manifest will be created and the manifest group will
         # be empty during the pull
         self.manifestheader()
         deltas = self.deltaiter()
         repo.manifestlog.addgroup(deltas, revmap, trp)
         prog.complete()
         self.callback = None

     def apply(self, repo, tr, srctype, url, targetphase=phases.draft,
               expectedtotal=None):
         """Add the changegroup returned by source.read() to this repo.
         srctype is a string like 'push', 'pull', or 'unbundle'. url is
         the URL of the repo where this changegroup is coming from.

         Return an integer summarizing the change to this repo:
         - nothing changed or no source: 0
         - more heads than before: 1+added heads (2..n)
         - fewer heads than before: -1-removed heads (-2..-n)
         - number of heads stays the same: 1
         """
         repo = repo.unfiltered()
         def csmap(x):
             repo.ui.debug("add changeset %s\n" % short(x))
             return len(cl)

         def revmap(x):
             return cl.rev(x)

         changesets = files = revisions = 0

         try:
             # The transaction may already carry source information. In this
             # case we use the top level data. We overwrite the argument
             # because we need to use the top level value (if they exist)
             # in this function.
             srctype = tr.hookargs.setdefault('source', srctype)
             url = tr.hookargs.setdefault('url', url)
             repo.hook('prechangegroup',
                       throw=True, **pycompat.strkwargs(tr.hookargs))

             # write changelog data to temp files so concurrent readers
             # will not see an inconsistent view
             cl = repo.changelog
             cl.delayupdate(tr)
             oldheads = set(cl.heads())

             trp = weakref.proxy(tr)
             # pull off the changeset group
             repo.ui.status(_("adding changesets\n"))
             clstart = len(cl)
             progress = repo.ui.makeprogress(_('changesets'), unit=_('chunks'),
                                             total=expectedtotal)
             self.callback = progress.increment

             efiles = set()
             def onchangelog(cl, node):
                 efiles.update(cl.readfiles(node))

             self.changelogheader()
             deltas = self.deltaiter()
             cgnodes = cl.addgroup(deltas, csmap, trp, addrevisioncb=onchangelog)
             efiles = len(efiles)

             if not cgnodes:
                 repo.ui.develwarn('applied empty changegroup',
                                   config='warn-empty-changegroup')
             clend = len(cl)
             changesets = clend - clstart
             progress.complete()
             self.callback = None

             # pull off the manifest group
             repo.ui.status(_("adding manifests\n"))
             # We know that we'll never have more manifests than we had
             # changesets.
             progress = repo.ui.makeprogress(_('manifests'), unit=_('chunks'),
                                             total=changesets)
             self._unpackmanifests(repo, revmap, trp, progress)

             needfiles = {}
             if repo.ui.configbool('server', 'validate'):
                 cl = repo.changelog
                 ml = repo.manifestlog
                 # validate incoming csets have their manifests
                 for cset in pycompat.xrange(clstart, clend):
                     mfnode = cl.changelogrevision(cset).manifest
                     mfest = ml[mfnode].readdelta()
                     # store file cgnodes we must see
                     for f, n in mfest.iteritems():
                         needfiles.setdefault(f, set()).add(n)

             # process the files
             repo.ui.status(_("adding file changes\n"))
             newrevs, newfiles = _addchangegroupfiles(
                 repo, self, revmap, trp, efiles, needfiles)
             revisions += newrevs
             files += newfiles

             deltaheads = 0
             if oldheads:
                 heads = cl.heads()
                 deltaheads = len(heads) - len(oldheads)
                 for h in heads:
                     if h not in oldheads and repo[h].closesbranch():
                         deltaheads -= 1
             htext = ""
             if deltaheads:
                 htext = _(" (%+d heads)") % deltaheads

             repo.ui.status(_("added %d changesets"
                              " with %d changes to %d files%s\n")
                            % (changesets, revisions, files, htext))
             repo.invalidatevolatilesets()

             if changesets > 0:
                 if 'node' not in tr.hookargs:
                     tr.hookargs['node'] = hex(cl.node(clstart))
                     tr.hookargs['node_last'] = hex(cl.node(clend - 1))
                     hookargs = dict(tr.hookargs)
                 else:
                     hookargs = dict(tr.hookargs)
                     hookargs['node'] = hex(cl.node(clstart))
                     hookargs['node_last'] = hex(cl.node(clend - 1))
                 repo.hook('pretxnchangegroup',
                           throw=True, **pycompat.strkwargs(hookargs))

             added = [cl.node(r) for r in pycompat.xrange(clstart, clend)]
             phaseall = None
             if srctype in ('push', 'serve'):
                 # Old servers cannot push the boundary themselves.
                 # New servers won't push the boundary if changeset already
                 # exists locally as secret
                 #
                 # We should not use added here but the list of all changes
                 # in the bundle
                 if repo.publishing():
                     targetphase = phaseall = phases.public
                 else:
                     # closer target phase computation

                     # Those changesets have been pushed from the
                     # outside, their phases are going to be pushed
                     # alongside. Therefore `targetphase` is
                     # ignored.
                     targetphase = phaseall = phases.draft
             if added:
                 phases.registernew(repo, tr, targetphase, added)
             if phaseall is not None:
                 phases.advanceboundary(repo, tr, phaseall, cgnodes)

             if changesets > 0:

                 def runhooks():
                     # These hooks run when the lock releases, not when the
                     # transaction closes. So it's possible for the changelog
                     # to have changed since we last saw it.
                     if clstart >= len(repo):
                         return

                     repo.hook("changegroup", **pycompat.strkwargs(hookargs))

                     for n in added:
                         args = hookargs.copy()
                         args['node'] = hex(n)
                         del args['node_last']
                         repo.hook("incoming", **pycompat.strkwargs(args))

                     newheads = [h for h in repo.heads()
                                 if h not in oldheads]
                     repo.ui.log("incoming",
                                 "%d incoming changes - new heads: %s\n",
                                 len(added),
                                 ', '.join([hex(c[:6]) for c in newheads]))

                 tr.addpostclose('changegroup-runhooks-%020i' % clstart,
                                 lambda tr: repo._afterlock(runhooks))
         finally:
             repo.ui.flush()
         # never return 0 here:
         if deltaheads < 0:
             ret = deltaheads - 1
         else:
             ret = deltaheads + 1
         return ret

     def deltaiter(self):
         """
         returns an iterator of the deltas in this changegroup

         Useful for passing to the underlying storage system to be stored.
         """
         chain = None
         for chunkdata in iter(lambda: self.deltachunk(chain), {}):
             # Chunkdata: (node, p1, p2, cs, deltabase, delta, flags)
             yield chunkdata
             chain = chunkdata[0]

 class cg2unpacker(cg1unpacker):
     """Unpacker for cg2 streams.

     cg2 streams add support for generaldelta, so the delta header
     format is slightly different. All other features about the data
     remain the same.
     """
     deltaheader = _CHANGEGROUPV2_DELTA_HEADER
     deltaheadersize = deltaheader.size
     version = '02'

     def _deltaheader(self, headertuple, prevnode):
         node, p1, p2, deltabase, cs = headertuple
         flags = 0
         return node, p1, p2, deltabase, cs, flags

 class cg3unpacker(cg2unpacker):
     """Unpacker for cg3 streams.

     cg3 streams add support for exchanging treemanifests and revlog
     flags. It adds the revlog flags to the delta header and an empty chunk
     separating manifests and files.
     """
     deltaheader = _CHANGEGROUPV3_DELTA_HEADER
     deltaheadersize = deltaheader.size
     version = '03'
     _grouplistcount = 2 # One list of manifests and one list of files

     def _deltaheader(self, headertuple, prevnode):
         node, p1, p2, deltabase, cs, flags = headertuple
         return node, p1, p2, deltabase, cs, flags

     def _unpackmanifests(self, repo, revmap, trp, prog):
         super(cg3unpacker, self)._unpackmanifests(repo, revmap, trp, prog)
         for chunkdata in iter(self.filelogheader, {}):
             # If we get here, there are directory manifests in the changegroup
             d = chunkdata["filename"]
             repo.ui.debug("adding %s revisions\n" % d)
             dirlog = repo.manifestlog._revlog.dirlog(d)
             deltas = self.deltaiter()
             if not dirlog.addgroup(deltas, revmap, trp):
                 raise error.Abort(_("received dir revlog group is empty"))

 class headerlessfixup(object):
     def __init__(self, fh, h):
         self._h = h
         self._fh = fh
     def read(self, n):
         if self._h:
             d, self._h = self._h[:n], self._h[n:]
             if len(d) < n:
                 d += readexactly(self._fh, n - len(d))
             return d
         return readexactly(self._fh, n)

 @attr.s(slots=True, frozen=True)
 class revisiondelta(object):
     """Describes a delta entry in a changegroup.

     Captured data is sufficient to serialize the delta into multiple
     formats.
     """
     # 20 byte node of this revision.
     node = attr.ib()
     # 20 byte nodes of parent revisions.
     p1node = attr.ib()
     p2node = attr.ib()
     # 20 byte node of node this delta is against.
     basenode = attr.ib()
     # 20 byte node of changeset revision this delta is associated with.
     linknode = attr.ib()
     # 2 bytes of flags to apply to revision data.
     flags = attr.ib()
     # Iterable of chunks holding raw delta data.
     deltachunks = attr.ib()

 class cgpacker(object):
     def __init__(self, repo, filematcher, version, allowreorder,
                  useprevdelta, builddeltaheader, manifestsend,
-                 sendtreemanifests, bundlecaps=None, shallow=False):
+                 sendtreemanifests, bundlecaps=None, shallow=False,
+                 ellipsisroots=None):
         """Given a source repo, construct a bundler.

         filematcher is a matcher that matches on files to include in the
         changegroup. Used to facilitate sparse changegroups.

         allowreorder controls whether reordering of revisions is allowed.
         This value is used when ``bundle.reorder`` is ``auto`` or isn't
         set.

         useprevdelta controls whether revisions should always delta against
         the previous revision in the changegroup.

         builddeltaheader is a callable that constructs the header for a group
         delta.

         manifestsend is a chunk to send after manifests have been fully emitted.

         sendtreemanifests indicates whether tree manifests should be emitted.

         bundlecaps is optional and can be used to specify the set of
         capabilities which can be used to build the bundle. While bundlecaps is
         unused in core Mercurial, extensions rely on this feature to communicate
         capabilities to customize the changegroup packer.

         shallow indicates whether shallow data might be sent. The packer may
         need to pack file contents not introduced by the changes being packed.
         """
         assert filematcher
         self._filematcher = filematcher

         self.version = version
         self._useprevdelta = useprevdelta
         self._builddeltaheader = builddeltaheader
         self._manifestsend = manifestsend
         self._sendtreemanifests = sendtreemanifests

         # Set of capabilities we can use to build the bundle.
         if bundlecaps is None:
             bundlecaps = set()
         self._bundlecaps = bundlecaps
         self._isshallow = shallow

+        # Maps ellipsis revs to their roots at the changelog level.
+        self._precomputedellipsis = ellipsisroots
+
         # experimental config: bundle.reorder
         reorder = repo.ui.config('bundle', 'reorder')
         if reorder == 'auto':
             self._reorder = allowreorder
         else:
             self._reorder = stringutil.parsebool(reorder)

         self._repo = repo

         if self._repo.ui.verbose and not self._repo.ui.debugflag:
             self._verbosenote = self._repo.ui.note
         else:
             self._verbosenote = lambda s: None

         # TODO the functionality keyed off of this should probably be
         # controlled via arguments to group() that influence behavior.
         self._changelogdone = False

         # Maps CL revs to per-revlog revisions. Cleared in close() at
         # the end of each group.
         self._clrevtolocalrev = {}
         self._nextclrevtolocalrev = {}

         # Maps changelog nodes to changelog revs. Filled in once
         # during changelog stage and then left unmodified.
         self._clnodetorev = {}

     def _close(self):
         # Ellipses serving mode.
         self._clrevtolocalrev.clear()
         if self._nextclrevtolocalrev:
             self.clrevtolocalrev = self._nextclrevtolocalrev
             self._nextclrevtolocalrev.clear()
         self._changelogdone = True

         return closechunk()

     def _fileheader(self, fname):
         return chunkheader(len(fname)) + fname

     # Extracted both for clarity and for overriding in extensions.
     def _sortgroup(self, store, nodelist, lookup):
         """Sort nodes for change group and turn them into revnums."""
         # Ellipses serving mode.
         #
         # In a perfect world, we'd generate better ellipsis-ified graphs
         # for non-changelog revlogs. In practice, we haven't started doing
         # that yet, so the resulting DAGs for the manifestlog and filelogs
         # are actually full of bogus parentage on all the ellipsis
         # nodes. This has the side effect that, while the contents are
         # correct, the individual DAGs might be completely out of whack in
         # a case like 882681bc3166 and its ancestors (back about 10
         # revisions or so) in the main hg repo.
         #
         # The one invariant we *know* holds is that the new (potentially
         # bogus) DAG shape will be valid if we order the nodes in the
         # order that they're introduced in dramatis personae by the
         # changelog, so what we do is we sort the non-changelog histories
         # by the order in which they are used by the changelog.
         if util.safehasattr(self, '_full_nodes') and self._clnodetorev:
             key = lambda n: self._clnodetorev[lookup(n)]
             return [store.rev(n) for n in sorted(nodelist, key=key)]

         # for generaldelta revlogs, we linearize the revs; this will both be
         # much quicker and generate a much smaller bundle
         if (store._generaldelta and self._reorder is None) or self._reorder:
             dag = dagutil.revlogdag(store)
             return dag.linearize(set(store.rev(n) for n in nodelist))
         else:
             return sorted([store.rev(n) for n in nodelist])

     def group(self, nodelist, store, lookup, units=None):
         """Calculate a delta group, yielding a sequence of changegroup chunks
         (strings).

         Given a list of changeset revs, return a set of deltas and
         metadata corresponding to nodes. The first delta is
         first parent(nodelist[0]) -> nodelist[0], the receiver is
         guaranteed to have this parent as it has all history before
         these changesets. In the case firstparent is nullrev the
         changegroup starts with a full revision.

         If units is not None, progress detail will be generated; units
         specifies the type of revlog that is touched (changelog, manifest,
         etc.).
         """
         # if we don't have any revisions touched by these changesets, bail
         if len(nodelist) == 0:
             yield self._close()
             return

         revs = self._sortgroup(store, nodelist, lookup)

         # add the parent of the first rev
         p = store.parentrevs(revs[0])[0]
         revs.insert(0, p)

         # build deltas
         progress = None
         if units is not None:
             progress = self._repo.ui.makeprogress(_('bundling'), unit=units,
                                                   total=(len(revs) - 1))
         for r in pycompat.xrange(len(revs) - 1):
             if progress:
                 progress.update(r + 1)
             prev, curr = revs[r], revs[r + 1]
             linknode = lookup(store.node(curr))
             for c in self._revchunk(store, curr, prev, linknode):
                 yield c

         if progress:
             progress.complete()
         yield self._close()

     # filter any nodes that claim to be part of the known set
     def _prune(self, store, missing, commonrevs):
         # TODO this violates storage abstraction for manifests.
         if isinstance(store, manifest.manifestrevlog):
             if not self._filematcher.visitdir(store._dir[:-1] or '.'):
                 return []

         rr, rl = store.rev, store.linkrev
         return [n for n in missing if rl(rr(n)) not in commonrevs]

     def _packmanifests(self, dir, mfnodes, lookuplinknode):
         """Pack flat manifests into a changegroup stream."""
         assert not dir
         for chunk in self.group(mfnodes, self._repo.manifestlog._revlog,
                                 lookuplinknode, units=_('manifests')):
             yield chunk

     def _packtreemanifests(self, dir, mfnodes, lookuplinknode):
         """Version of _packmanifests that operates on directory manifests.

         Encodes the directory name in the output so multiple manifests
         can be sent.
         """
         assert self.version == b'03'

         if dir:
             yield self._fileheader(dir)

         # TODO violates storage abstractions by assuming revlogs.
         dirlog = self._repo.manifestlog._revlog.dirlog(dir)
         for chunk in self.group(mfnodes, dirlog, lookuplinknode,
                                 units=_('manifests')):
             yield chunk

     def generate(self, commonrevs, clnodes, fastpathlinkrev, source):
         '''yield a sequence of changegroup chunks (strings)'''
         repo = self._repo
         cl = repo.changelog

         clrevorder = {}
         mfs = {} # needed manifests
         fnodes = {} # needed file nodes
         mfl = repo.manifestlog
         # TODO violates storage abstraction.
         mfrevlog = mfl._revlog
         changedfiles = set()

         ellipsesmode = util.safehasattr(self, '_full_nodes')

         # Callback for the changelog, used to collect changed files and
         # manifest nodes.
         # Returns the linkrev node (identity in the changelog case).
         def lookupcl(x):
             c = cl.read(x)
             clrevorder[x] = len(clrevorder)

             if ellipsesmode:
                 # Only update mfs if x is going to be sent. Otherwise we
                 # end up with bogus linkrevs specified for manifests and
                 # we skip some manifest nodes that we should otherwise
                 # have sent.
                 if (x in self._full_nodes
-                    or cl.rev(x) in self._precomputed_ellipsis):
+                    or cl.rev(x) in self._precomputedellipsis):
                     n = c[0]
                     # Record the first changeset introducing this manifest
                     # version.
                     mfs.setdefault(n, x)
                     # Set this narrow-specific dict so we have the lowest
                     # manifest revnum to look up for this cl revnum. (Part of
                     # mapping changelog ellipsis parents to manifest ellipsis
                     # parents)
                     self._nextclrevtolocalrev.setdefault(cl.rev(x),
                                                          mfrevlog.rev(n))
                 # We can't trust the changed files list in the changeset if the
                 # client requested a shallow clone.
                 if self._isshallow:
                     changedfiles.update(mfl[c[0]].read().keys())
                 else:
                     changedfiles.update(c[3])
             else:

                 n = c[0]
                 # record the first changeset introducing this manifest version
                 mfs.setdefault(n, x)
                 # Record a complete list of potentially-changed files in
                 # this manifest.
                 changedfiles.update(c[3])

             return x

         self._verbosenote(_('uncompressed size of bundle content:\n'))
         size = 0
         for chunk in self.group(clnodes, cl, lookupcl, units=_('changesets')):
             size += len(chunk)
             yield chunk
         self._verbosenote(_('%8.i (changelog)\n') % size)

         # We need to make sure that the linkrev in the changegroup refers to
         # the first changeset that introduced the manifest or file revision.
         # The fastpath is usually safer than the slowpath, because the filelogs
         # are walked in revlog order.
         #
         # When taking the slowpath with reorder=None and the manifest revlog
         # uses generaldelta, the manifest may be walked in the "wrong" order.
         # Without 'clrevorder', we would get an incorrect linkrev (see fix in
         # cc0ff93d0c0c).
         #
         # When taking the fastpath, we are only vulnerable to reordering
         # of the changelog itself. The changelog never uses generaldelta, so
         # it is only reordered when reorder=True. To handle this case, we
         # simply take the slowpath, which already has the 'clrevorder' logic.
         # This was also fixed in cc0ff93d0c0c.
         fastpathlinkrev = fastpathlinkrev and not self._reorder
         # Treemanifests don't work correctly with fastpathlinkrev
         # either, because we don't discover which directory nodes to
         # send along with files. This could probably be fixed.
         fastpathlinkrev = fastpathlinkrev and (
             'treemanifest' not in repo.requirements)

         for chunk in self.generatemanifests(commonrevs, clrevorder,
                                             fastpathlinkrev, mfs, fnodes, source):
             yield chunk

         if ellipsesmode:
             mfdicts = None
             if self._isshallow:
                 mfdicts = [(self._repo.manifestlog[n].read(), lr)
                            for (n, lr) in mfs.iteritems()]

         mfs.clear()
         clrevs = set(cl.rev(x) for x in clnodes)

         if not fastpathlinkrev:
             def linknodes(unused, fname):
                 return fnodes.get(fname, {})
         else:
             cln = cl.node
             def linknodes(filerevlog, fname):
                 llr = filerevlog.linkrev
                 fln = filerevlog.node
                 revs = ((r, llr(r)) for r in filerevlog)
                 return dict((fln(r), cln(lr)) for r, lr in revs if lr in clrevs)

         if ellipsesmode:
             # We need to pass the mfdicts variable down into
             # generatefiles(), but more than one command might have
             # wrapped generatefiles so we can't modify the function
             # signature. Instead, we pass the data to ourselves using an
             # instance attribute. I'm sorry.
             self._mfdicts = mfdicts

         for chunk in self.generatefiles(changedfiles, linknodes, commonrevs,
                                         source):
             yield chunk

         yield self._close()

         if clnodes:
             repo.hook('outgoing', node=hex(clnodes[0]), source=source)

841 def generatemanifests(self, commonrevs, clrevorder, fastpathlinkrev, mfs,
845 def generatemanifests(self, commonrevs, clrevorder, fastpathlinkrev, mfs,
842 fnodes, source):
846 fnodes, source):
843 """Returns an iterator of changegroup chunks containing manifests.
847 """Returns an iterator of changegroup chunks containing manifests.
844
848
845 `source` is unused here, but is used by extensions like remotefilelog to
849 `source` is unused here, but is used by extensions like remotefilelog to
846 change what is sent based on pulls vs pushes, etc.
850 change what is sent based on pulls vs pushes, etc.
847 """
851 """
848 repo = self._repo
852 repo = self._repo
849 mfl = repo.manifestlog
853 mfl = repo.manifestlog
850 dirlog = mfl._revlog.dirlog
854 dirlog = mfl._revlog.dirlog
851 tmfnodes = {'': mfs}
855 tmfnodes = {'': mfs}
852
856
853 # Callback for the manifest, used to collect linkrevs for filelog
857 # Callback for the manifest, used to collect linkrevs for filelog
854 # revisions.
858 # revisions.
855 # Returns the linkrev node (collected in lookupcl).
859 # Returns the linkrev node (collected in lookupcl).
856 def makelookupmflinknode(dir, nodes):
860 def makelookupmflinknode(dir, nodes):
857 if fastpathlinkrev:
861 if fastpathlinkrev:
858 assert not dir
862 assert not dir
859 return mfs.__getitem__
863 return mfs.__getitem__
860
864
861 def lookupmflinknode(x):
865 def lookupmflinknode(x):
862 """Callback for looking up the linknode for manifests.
866 """Callback for looking up the linknode for manifests.
863
867
864 Returns the linkrev node for the specified manifest.
868 Returns the linkrev node for the specified manifest.
865
869
866 SIDE EFFECT:
870 SIDE EFFECT:
867
871
868 1) fclnodes gets populated with the list of relevant
872 1) fclnodes gets populated with the list of relevant
869 file nodes if we're not using fastpathlinkrev
873 file nodes if we're not using fastpathlinkrev
870 2) When treemanifests are in use, collects treemanifest nodes
874 2) When treemanifests are in use, collects treemanifest nodes
871 to send
875 to send
872
876
873 Note that this means manifests must be completely sent to
877 Note that this means manifests must be completely sent to
874 the client before you can trust the list of files and
878 the client before you can trust the list of files and
875 treemanifests to send.
879 treemanifests to send.
876 """
880 """
877 clnode = nodes[x]
881 clnode = nodes[x]
878 mdata = mfl.get(dir, x).readfast(shallow=True)
882 mdata = mfl.get(dir, x).readfast(shallow=True)
879 for p, n, fl in mdata.iterentries():
883 for p, n, fl in mdata.iterentries():
880 if fl == 't': # subdirectory manifest
884 if fl == 't': # subdirectory manifest
881 subdir = dir + p + '/'
885 subdir = dir + p + '/'
882 tmfclnodes = tmfnodes.setdefault(subdir, {})
886 tmfclnodes = tmfnodes.setdefault(subdir, {})
883 tmfclnode = tmfclnodes.setdefault(n, clnode)
887 tmfclnode = tmfclnodes.setdefault(n, clnode)
884 if clrevorder[clnode] < clrevorder[tmfclnode]:
888 if clrevorder[clnode] < clrevorder[tmfclnode]:
885 tmfclnodes[n] = clnode
889 tmfclnodes[n] = clnode
886 else:
890 else:
887 f = dir + p
891 f = dir + p
888 fclnodes = fnodes.setdefault(f, {})
892 fclnodes = fnodes.setdefault(f, {})
889 fclnode = fclnodes.setdefault(n, clnode)
893 fclnode = fclnodes.setdefault(n, clnode)
890 if clrevorder[clnode] < clrevorder[fclnode]:
894 if clrevorder[clnode] < clrevorder[fclnode]:
891 fclnodes[n] = clnode
895 fclnodes[n] = clnode
892 return clnode
896 return clnode
893 return lookupmflinknode
897 return lookupmflinknode
894
898
895 fn = (self._packtreemanifests if self._sendtreemanifests
899 fn = (self._packtreemanifests if self._sendtreemanifests
896 else self._packmanifests)
900 else self._packmanifests)
897 size = 0
901 size = 0
898 while tmfnodes:
902 while tmfnodes:
899 dir, nodes = tmfnodes.popitem()
903 dir, nodes = tmfnodes.popitem()
900 prunednodes = self._prune(dirlog(dir), nodes, commonrevs)
904 prunednodes = self._prune(dirlog(dir), nodes, commonrevs)
901 if not dir or prunednodes:
905 if not dir or prunednodes:
902 for x in fn(dir, prunednodes, makelookupmflinknode(dir, nodes)):
906 for x in fn(dir, prunednodes, makelookupmflinknode(dir, nodes)):
903 size += len(x)
907 size += len(x)
904 yield x
908 yield x
905 self._verbosenote(_('%8.i (manifests)\n') % size)
909 self._verbosenote(_('%8.i (manifests)\n') % size)
906 yield self._manifestsend
910 yield self._manifestsend
907
911
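generatemanifests() drains tmfnodes as a worklist: it starts with the root manifest, and lookupmflinknode's side effect queues subdirectory manifests discovered along the way until everything has been packed. A toy sketch of that drain loop with plain dicts (the 'children' table is illustrative data, not a Mercurial structure):

# Toy sketch of the tmfnodes worklist in generatemanifests(): packing
# one directory may discover subdirectory manifests, which are queued
# and drained in turn.
children = {'': ['a/', 'b/'], 'a/': ['a/x/'], 'b/': [], 'a/x/': []}

tmfnodes = {'': {'rootnode': 'clnode0'}}
packed = []
while tmfnodes:
    dir, nodes = tmfnodes.popitem()
    packed.append(dir)
    for subdir in children[dir]:
        tmfnodes.setdefault(subdir, {})[subdir + 'node'] = 'clnode0'

assert sorted(packed) == ['', 'a/', 'a/x/', 'b/']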
908 # The 'source' parameter is useful for extensions
912 # The 'source' parameter is useful for extensions
909 def generatefiles(self, changedfiles, linknodes, commonrevs, source):
913 def generatefiles(self, changedfiles, linknodes, commonrevs, source):
910 changedfiles = list(filter(self._filematcher, changedfiles))
914 changedfiles = list(filter(self._filematcher, changedfiles))
911
915
912 if self._isshallow:
916 if self._isshallow:
913 # See comment in generate() for why this sadness is a thing.
917 # See comment in generate() for why this sadness is a thing.
914 mfdicts = self._mfdicts
918 mfdicts = self._mfdicts
915 del self._mfdicts
919 del self._mfdicts
916 # In a shallow clone, the linknodes callback needs to also include
920 # In a shallow clone, the linknodes callback needs to also include
917 # those file nodes that are in the manifests we sent but weren't
921 # those file nodes that are in the manifests we sent but weren't
918 # introduced by those manifests.
922 # introduced by those manifests.
919 commonctxs = [self._repo[c] for c in commonrevs]
923 commonctxs = [self._repo[c] for c in commonrevs]
920 oldlinknodes = linknodes
924 oldlinknodes = linknodes
921 clrev = self._repo.changelog.rev
925 clrev = self._repo.changelog.rev
922
926
923 # Defining this function has a side-effect of overriding the
927 # Defining this function has a side-effect of overriding the
924 # function of the same name that was passed in as an argument.
928 # function of the same name that was passed in as an argument.
925 # TODO have caller pass in appropriate function.
929 # TODO have caller pass in appropriate function.
926 def linknodes(flog, fname):
930 def linknodes(flog, fname):
927 for c in commonctxs:
931 for c in commonctxs:
928 try:
932 try:
929 fnode = c.filenode(fname)
933 fnode = c.filenode(fname)
930 self._clrevtolocalrev[c.rev()] = flog.rev(fnode)
934 self._clrevtolocalrev[c.rev()] = flog.rev(fnode)
931 except error.ManifestLookupError:
935 except error.ManifestLookupError:
932 pass
936 pass
933 links = oldlinknodes(flog, fname)
937 links = oldlinknodes(flog, fname)
934 if len(links) != len(mfdicts):
938 if len(links) != len(mfdicts):
935 for mf, lr in mfdicts:
939 for mf, lr in mfdicts:
936 fnode = mf.get(fname, None)
940 fnode = mf.get(fname, None)
937 if fnode in links:
941 if fnode in links:
938 links[fnode] = min(links[fnode], lr, key=clrev)
942 links[fnode] = min(links[fnode], lr, key=clrev)
939 elif fnode:
943 elif fnode:
940 links[fnode] = lr
944 links[fnode] = lr
941 return links
945 return links
942
946
943 return self._generatefiles(changedfiles, linknodes, commonrevs, source)
947 return self._generatefiles(changedfiles, linknodes, commonrevs, source)
944
948
945 def _generatefiles(self, changedfiles, linknodes, commonrevs, source):
949 def _generatefiles(self, changedfiles, linknodes, commonrevs, source):
946 repo = self._repo
950 repo = self._repo
947 progress = repo.ui.makeprogress(_('bundling'), unit=_('files'),
951 progress = repo.ui.makeprogress(_('bundling'), unit=_('files'),
948 total=len(changedfiles))
952 total=len(changedfiles))
949 for i, fname in enumerate(sorted(changedfiles)):
953 for i, fname in enumerate(sorted(changedfiles)):
950 filerevlog = repo.file(fname)
954 filerevlog = repo.file(fname)
951 if not filerevlog:
955 if not filerevlog:
952 raise error.Abort(_("empty or missing file data for %s") %
956 raise error.Abort(_("empty or missing file data for %s") %
953 fname)
957 fname)
954
958
955 linkrevnodes = linknodes(filerevlog, fname)
959 linkrevnodes = linknodes(filerevlog, fname)
956 # Look up filenodes; we collected the linkrev nodes above in the
960 # Look up filenodes; we collected the linkrev nodes above in the
957 # fastpath case and with lookupmf in the slowpath case.
961 # fastpath case and with lookupmf in the slowpath case.
958 def lookupfilelog(x):
962 def lookupfilelog(x):
959 return linkrevnodes[x]
963 return linkrevnodes[x]
960
964
961 filenodes = self._prune(filerevlog, linkrevnodes, commonrevs)
965 filenodes = self._prune(filerevlog, linkrevnodes, commonrevs)
962 if filenodes:
966 if filenodes:
963 progress.update(i + 1, item=fname)
967 progress.update(i + 1, item=fname)
964 h = self._fileheader(fname)
968 h = self._fileheader(fname)
965 size = len(h)
969 size = len(h)
966 yield h
970 yield h
967 for chunk in self.group(filenodes, filerevlog, lookupfilelog):
971 for chunk in self.group(filenodes, filerevlog, lookupfilelog):
968 size += len(chunk)
972 size += len(chunk)
969 yield chunk
973 yield chunk
970 self._verbosenote(_('%8.i %s\n') % (size, fname))
974 self._verbosenote(_('%8.i %s\n') % (size, fname))
971 progress.complete()
975 progress.complete()
972
976
973 def _deltaparent(self, store, rev, p1, p2, prev):
977 def _deltaparent(self, store, rev, p1, p2, prev):
974 if self._useprevdelta:
978 if self._useprevdelta:
975 if not store.candelta(prev, rev):
979 if not store.candelta(prev, rev):
976 raise error.ProgrammingError(
980 raise error.ProgrammingError(
977 'cg1 should not be used in this case')
981 'cg1 should not be used in this case')
978 return prev
982 return prev
979
983
980 # Narrow ellipses mode.
984 # Narrow ellipses mode.
981 if util.safehasattr(self, '_full_nodes'):
985 if util.safehasattr(self, '_full_nodes'):
982 # TODO: send better deltas when in narrow mode.
986 # TODO: send better deltas when in narrow mode.
983 #
987 #
984 # changegroup.group() loops over revisions to send,
988 # changegroup.group() loops over revisions to send,
985 # including revisions we'll skip. What this means is that
989 # including revisions we'll skip. What this means is that
986 # `prev` will be a potentially useless delta base for all
990 # `prev` will be a potentially useless delta base for all
987 # ellipsis nodes, as the client likely won't have it. In
991 # ellipsis nodes, as the client likely won't have it. In
988 # the future we should do bookkeeping about which nodes
992 # the future we should do bookkeeping about which nodes
989 # have been sent to the client, and try to be
993 # have been sent to the client, and try to be
990 # significantly smarter about delta bases. This is
994 # significantly smarter about delta bases. This is
991 # slightly tricky because this same code has to work for
995 # slightly tricky because this same code has to work for
992 # all revlogs, and we don't have the linkrev/linknode here.
996 # all revlogs, and we don't have the linkrev/linknode here.
993 return p1
997 return p1
994
998
995 dp = store.deltaparent(rev)
999 dp = store.deltaparent(rev)
996 if dp == nullrev and store.storedeltachains:
1000 if dp == nullrev and store.storedeltachains:
997 # Avoid sending full revisions when delta parent is null. Pick prev
1001 # Avoid sending full revisions when delta parent is null. Pick prev
998 # in that case. It's tempting to pick p1 in this case, as p1 will
1002 # in that case. It's tempting to pick p1 in this case, as p1 will
999 # be smaller in the common case. However, computing a delta against
1003 # be smaller in the common case. However, computing a delta against
1000 # p1 may require resolving the raw text of p1, which could be
1004 # p1 may require resolving the raw text of p1, which could be
1001 # expensive. The revlog caches should have prev cached, meaning
1005 # expensive. The revlog caches should have prev cached, meaning
1002 # less CPU for changegroup generation. There is likely room to add
1006 # less CPU for changegroup generation. There is likely room to add
1003 # a flag and/or config option to control this behavior.
1007 # a flag and/or config option to control this behavior.
1004 base = prev
1008 base = prev
1005 elif dp == nullrev:
1009 elif dp == nullrev:
1006 # revlog is configured to use full snapshot for a reason,
1010 # revlog is configured to use full snapshot for a reason,
1007 # stick to full snapshot.
1011 # stick to full snapshot.
1008 base = nullrev
1012 base = nullrev
1009 elif dp not in (p1, p2, prev):
1013 elif dp not in (p1, p2, prev):
1010 # Pick prev when we can't be sure remote has the base revision.
1014 # Pick prev when we can't be sure remote has the base revision.
1011 return prev
1015 return prev
1012 else:
1016 else:
1013 base = dp
1017 base = dp
1014
1018
1015 if base != nullrev and not store.candelta(base, rev):
1019 if base != nullrev and not store.candelta(base, rev):
1016 base = nullrev
1020 base = nullrev
1017
1021
1018 return base
1022 return base
1019
1023
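As a reading aid, the generaldelta branch of _deltaparent above can be restated as a pure function. This is a sketch under that framing, not code from the module (nullrev is -1, as in Mercurial):

# Pure-function restatement of the generaldelta branch of _deltaparent.
nullrev = -1

def choosedeltabase(dp, rev, p1, p2, prev, storedeltachains, candelta):
    if dp == nullrev and storedeltachains:
        base = prev        # prev is likely cached, so diffing is cheap
    elif dp == nullrev:
        base = nullrev     # the store insists on a full snapshot
    elif dp not in (p1, p2, prev):
        return prev        # remote may not have dp; prev is safe
    else:
        base = dp
    if base != nullrev and not candelta(base, rev):
        base = nullrev
    return base

# No stored delta parent, but delta chains enabled: prev is chosen.
assert choosedeltabase(nullrev, 7, 5, nullrev, 6, True,
                       lambda a, b: True) == 6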
1020 def _revchunk(self, store, rev, prev, linknode):
1024 def _revchunk(self, store, rev, prev, linknode):
1021 if util.safehasattr(self, '_full_nodes'):
1025 if util.safehasattr(self, '_full_nodes'):
1022 fn = self._revisiondeltanarrow
1026 fn = self._revisiondeltanarrow
1023 else:
1027 else:
1024 fn = self._revisiondeltanormal
1028 fn = self._revisiondeltanormal
1025
1029
1026 delta = fn(store, rev, prev, linknode)
1030 delta = fn(store, rev, prev, linknode)
1027 if not delta:
1031 if not delta:
1028 return
1032 return
1029
1033
1030 meta = self._builddeltaheader(delta)
1034 meta = self._builddeltaheader(delta)
1031 l = len(meta) + sum(len(x) for x in delta.deltachunks)
1035 l = len(meta) + sum(len(x) for x in delta.deltachunks)
1032
1036
1033 yield chunkheader(l)
1037 yield chunkheader(l)
1034 yield meta
1038 yield meta
1035 for x in delta.deltachunks:
1039 for x in delta.deltachunks:
1036 yield x
1040 yield x
1037
1041
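_revchunk() frames each revision as a length-prefixed chunk: a 4-byte big-endian length that counts itself, followed by the header and delta payload, with a zero length terminating the stream. A minimal round-trip of that framing in plain Python:

import struct
from io import BytesIO

# Minimal round-trip of the chunk framing used by _revchunk().
def frame(payload):
    return struct.pack(">l", len(payload) + 4) + payload

stream = BytesIO(frame(b'meta') + frame(b'delta') + struct.pack(">l", 0))

chunks = []
while True:
    l = struct.unpack(">l", stream.read(4))[0]
    if l <= 4:
        break
    chunks.append(stream.read(l - 4))

assert chunks == [b'meta', b'delta']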
1038 def _revisiondeltanormal(self, store, rev, prev, linknode):
1042 def _revisiondeltanormal(self, store, rev, prev, linknode):
1039 node = store.node(rev)
1043 node = store.node(rev)
1040 p1, p2 = store.parentrevs(rev)
1044 p1, p2 = store.parentrevs(rev)
1041 base = self._deltaparent(store, rev, p1, p2, prev)
1045 base = self._deltaparent(store, rev, p1, p2, prev)
1042
1046
1043 prefix = ''
1047 prefix = ''
1044 if store.iscensored(base) or store.iscensored(rev):
1048 if store.iscensored(base) or store.iscensored(rev):
1045 try:
1049 try:
1046 delta = store.revision(node, raw=True)
1050 delta = store.revision(node, raw=True)
1047 except error.CensoredNodeError as e:
1051 except error.CensoredNodeError as e:
1048 delta = e.tombstone
1052 delta = e.tombstone
1049 if base == nullrev:
1053 if base == nullrev:
1050 prefix = mdiff.trivialdiffheader(len(delta))
1054 prefix = mdiff.trivialdiffheader(len(delta))
1051 else:
1055 else:
1052 baselen = store.rawsize(base)
1056 baselen = store.rawsize(base)
1053 prefix = mdiff.replacediffheader(baselen, len(delta))
1057 prefix = mdiff.replacediffheader(baselen, len(delta))
1054 elif base == nullrev:
1058 elif base == nullrev:
1055 delta = store.revision(node, raw=True)
1059 delta = store.revision(node, raw=True)
1056 prefix = mdiff.trivialdiffheader(len(delta))
1060 prefix = mdiff.trivialdiffheader(len(delta))
1057 else:
1061 else:
1058 delta = store.revdiff(base, rev)
1062 delta = store.revdiff(base, rev)
1059 p1n, p2n = store.parents(node)
1063 p1n, p2n = store.parents(node)
1060
1064
1061 return revisiondelta(
1065 return revisiondelta(
1062 node=node,
1066 node=node,
1063 p1node=p1n,
1067 p1node=p1n,
1064 p2node=p2n,
1068 p2node=p2n,
1065 basenode=store.node(base),
1069 basenode=store.node(base),
1066 linknode=linknode,
1070 linknode=linknode,
1067 flags=store.flags(rev),
1071 flags=store.flags(rev),
1068 deltachunks=(prefix, delta),
1072 deltachunks=(prefix, delta),
1069 )
1073 )
1070
1074
1071 def _revisiondeltanarrow(self, store, rev, prev, linknode):
1075 def _revisiondeltanarrow(self, store, rev, prev, linknode):
1072 # build up some mapping information that's useful later. See
1076 # build up some mapping information that's useful later. See
1073 # the local() nested function below.
1077 # the local() nested function below.
1074 if not self._changelogdone:
1078 if not self._changelogdone:
1075 self._clnodetorev[linknode] = rev
1079 self._clnodetorev[linknode] = rev
1076 linkrev = rev
1080 linkrev = rev
1077 self._clrevtolocalrev[linkrev] = rev
1081 self._clrevtolocalrev[linkrev] = rev
1078 else:
1082 else:
1079 linkrev = self._clnodetorev[linknode]
1083 linkrev = self._clnodetorev[linknode]
1080 self._clrevtolocalrev[linkrev] = rev
1084 self._clrevtolocalrev[linkrev] = rev
1081
1085
1082 # This is a node to send in full, because the changeset it
1086 # This is a node to send in full, because the changeset it
1083 # corresponds to was a full changeset.
1087 # corresponds to was a full changeset.
1084 if linknode in self._full_nodes:
1088 if linknode in self._full_nodes:
1085 return self._revisiondeltanormal(store, rev, prev, linknode)
1089 return self._revisiondeltanormal(store, rev, prev, linknode)
1086
1090
1087 # At this point, a node can either be one we should skip or an
1091 # At this point, a node can either be one we should skip or an
1088 # ellipsis. If it's not an ellipsis, bail immediately.
1092 # ellipsis. If it's not an ellipsis, bail immediately.
1089 if linkrev not in self._precomputed_ellipsis:
1093 if linkrev not in self._precomputedellipsis:
1090 return
1094 return
1091
1095
1092 linkparents = self._precomputed_ellipsis[linkrev]
1096 linkparents = self._precomputedellipsis[linkrev]
1093 def local(clrev):
1097 def local(clrev):
1094 """Turn a changelog revnum into a local revnum.
1098 """Turn a changelog revnum into a local revnum.
1095
1099
1096 The ellipsis dag is stored as revnums on the changelog,
1100 The ellipsis dag is stored as revnums on the changelog,
1097 but when we're producing ellipsis entries for
1101 but when we're producing ellipsis entries for
1098 non-changelog revlogs, we need to turn those numbers into
1102 non-changelog revlogs, we need to turn those numbers into
1099 something local. This does that for us, and during the
1103 something local. This does that for us, and during the
1100 changelog sending phase will also expand the stored
1104 changelog sending phase will also expand the stored
1101 mappings as needed.
1105 mappings as needed.
1102 """
1106 """
1103 if clrev == nullrev:
1107 if clrev == nullrev:
1104 return nullrev
1108 return nullrev
1105
1109
1106 if not self._changelogdone:
1110 if not self._changelogdone:
1107 # If we're doing the changelog, it's possible that we
1111 # If we're doing the changelog, it's possible that we
1108 # have a parent that is already on the client, and we
1112 # have a parent that is already on the client, and we
1109 # need to store some extra mapping information so that
1113 # need to store some extra mapping information so that
1110 # our contained ellipsis nodes will be able to resolve
1114 # our contained ellipsis nodes will be able to resolve
1111 # their parents.
1115 # their parents.
1112 if clrev not in self._clrevtolocalrev:
1116 if clrev not in self._clrevtolocalrev:
1113 clnode = store.node(clrev)
1117 clnode = store.node(clrev)
1114 self._clnodetorev[clnode] = clrev
1118 self._clnodetorev[clnode] = clrev
1115 return clrev
1119 return clrev
1116
1120
1117 # Walk the ellipsis-ized changelog breadth-first looking for a
1121 # Walk the ellipsis-ized changelog breadth-first looking for a
1118 # change that has been linked from the current revlog.
1122 # change that has been linked from the current revlog.
1119 #
1123 #
1120 # For a flat manifest revlog only a single step should be necessary
1124 # For a flat manifest revlog only a single step should be necessary
1121 # as all relevant changelog entries are relevant to the flat
1125 # as all relevant changelog entries are relevant to the flat
1122 # manifest.
1126 # manifest.
1123 #
1127 #
1124 # For a filelog or tree manifest dirlog however not every changelog
1128 # For a filelog or tree manifest dirlog however not every changelog
1125 # entry will have been relevant, so we need to skip some changelog
1129 # entry will have been relevant, so we need to skip some changelog
1126 # nodes even after ellipsis-izing.
1130 # nodes even after ellipsis-izing.
1127 walk = [clrev]
1131 walk = [clrev]
1128 while walk:
1132 while walk:
1129 p = walk[0]
1133 p = walk[0]
1130 walk = walk[1:]
1134 walk = walk[1:]
1131 if p in self._clrevtolocalrev:
1135 if p in self._clrevtolocalrev:
1132 return self._clrevtolocalrev[p]
1136 return self._clrevtolocalrev[p]
1133 elif p in self._full_nodes:
1137 elif p in self._full_nodes:
1134 walk.extend([pp for pp in self._repo.changelog.parentrevs(p)
1138 walk.extend([pp for pp in self._repo.changelog.parentrevs(p)
1135 if pp != nullrev])
1139 if pp != nullrev])
1136 elif p in self._precomputed_ellipsis:
1140 elif p in self._precomputedellipsis:
1137 walk.extend([pp for pp in self._precomputed_ellipsis[p]
1141 walk.extend([pp for pp in self._precomputedellipsis[p]
1138 if pp != nullrev])
1142 if pp != nullrev])
1139 else:
1143 else:
1140 # In this case, we've got an ellipsis with parents
1144 # In this case, we've got an ellipsis with parents
1141 # outside the current bundle (likely an
1145 # outside the current bundle (likely an
1142 # incremental pull). We "know" that we can use the
1146 # incremental pull). We "know" that we can use the
1143 # value of this same revlog at whatever revision
1147 # value of this same revlog at whatever revision
1144 # is pointed to by linknode. "Know" is in scare
1148 # is pointed to by linknode. "Know" is in scare
1145 # quotes because I haven't done enough examination
1149 # quotes because I haven't done enough examination
1146 # of edge cases to convince myself this is really
1150 # of edge cases to convince myself this is really
1147 # a fact - it works for all the (admittedly
1151 # a fact - it works for all the (admittedly
1148 # thorough) cases in our testsuite, but I would be
1152 # thorough) cases in our testsuite, but I would be
1149 # somewhat unsurprised to find a case in the wild
1153 # somewhat unsurprised to find a case in the wild
1150 # where this breaks down a bit. That said, I don't
1154 # where this breaks down a bit. That said, I don't
1151 # know if it would hurt anything.
1155 # know if it would hurt anything.
1152 for i in pycompat.xrange(rev, 0, -1):
1156 for i in pycompat.xrange(rev, 0, -1):
1153 if store.linkrev(i) == clrev:
1157 if store.linkrev(i) == clrev:
1154 return i
1158 return i
1155 # We failed to resolve a parent for this node, so
1159 # We failed to resolve a parent for this node, so
1156 # we crash the changegroup construction.
1160 # we crash the changegroup construction.
1157 raise error.Abort(
1161 raise error.Abort(
1158 'unable to resolve parent while packing %r %r'
1162 'unable to resolve parent while packing %r %r'
1159 ' for changeset %r' % (store.indexfile, rev, clrev))
1163 ' for changeset %r' % (store.indexfile, rev, clrev))
1160
1164
1161 return nullrev
1165 return nullrev
1162
1166
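The breadth-first walk in local() reduces to: pop a changelog rev, return its local mapping if known, otherwise enqueue its parents and keep walking. A toy with plain dicts standing in for the instance state (illustrative only, not Mercurial APIs):

# Toy of the breadth-first walk in local().
clrevtolocalrev = {2: 0}             # clrev -> rev in this revlog
ellipsisparents = {7: [5], 5: [2]}   # clrev -> ellipsis parent revs

def resolvelocal(clrev):
    walk = [clrev]
    while walk:
        p = walk.pop(0)
        if p in clrevtolocalrev:
            return clrevtolocalrev[p]
        walk.extend(ellipsisparents.get(p, ()))
    return None

assert resolvelocal(7) == 0   # 7 -> 5 -> 2, which maps locally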
1163 if not linkparents or (
1167 if not linkparents or (
1164 store.parentrevs(rev) == (nullrev, nullrev)):
1168 store.parentrevs(rev) == (nullrev, nullrev)):
1165 p1, p2 = nullrev, nullrev
1169 p1, p2 = nullrev, nullrev
1166 elif len(linkparents) == 1:
1170 elif len(linkparents) == 1:
1167 p1, = sorted(local(p) for p in linkparents)
1171 p1, = sorted(local(p) for p in linkparents)
1168 p2 = nullrev
1172 p2 = nullrev
1169 else:
1173 else:
1170 p1, p2 = sorted(local(p) for p in linkparents)
1174 p1, p2 = sorted(local(p) for p in linkparents)
1171
1175
1172 n = store.node(rev)
1176 n = store.node(rev)
1173 p1n, p2n = store.node(p1), store.node(p2)
1177 p1n, p2n = store.node(p1), store.node(p2)
1174 flags = store.flags(rev)
1178 flags = store.flags(rev)
1175 flags |= revlog.REVIDX_ELLIPSIS
1179 flags |= revlog.REVIDX_ELLIPSIS
1176
1180
1177 # TODO: try and actually send deltas for ellipsis data blocks
1181 # TODO: try and actually send deltas for ellipsis data blocks
1178 data = store.revision(n)
1182 data = store.revision(n)
1179 diffheader = mdiff.trivialdiffheader(len(data))
1183 diffheader = mdiff.trivialdiffheader(len(data))
1180
1184
1181 return revisiondelta(
1185 return revisiondelta(
1182 node=n,
1186 node=n,
1183 p1node=p1n,
1187 p1node=p1n,
1184 p2node=p2n,
1188 p2node=p2n,
1185 basenode=nullid,
1189 basenode=nullid,
1186 linknode=linknode,
1190 linknode=linknode,
1187 flags=flags,
1191 flags=flags,
1188 deltachunks=(diffheader, data),
1192 deltachunks=(diffheader, data),
1189 )
1193 )
1190
1194
1191 def _makecg1packer(repo, filematcher, bundlecaps, shallow=False):
1195 def _makecg1packer(repo, filematcher, bundlecaps, shallow=False,
1196 ellipsisroots=None):
1192 builddeltaheader = lambda d: _CHANGEGROUPV1_DELTA_HEADER.pack(
1197 builddeltaheader = lambda d: _CHANGEGROUPV1_DELTA_HEADER.pack(
1193 d.node, d.p1node, d.p2node, d.linknode)
1198 d.node, d.p1node, d.p2node, d.linknode)
1194
1199
1195 return cgpacker(repo, filematcher, b'01',
1200 return cgpacker(repo, filematcher, b'01',
1196 useprevdelta=True,
1201 useprevdelta=True,
1197 allowreorder=None,
1202 allowreorder=None,
1198 builddeltaheader=builddeltaheader,
1203 builddeltaheader=builddeltaheader,
1199 manifestsend=b'',
1204 manifestsend=b'',
1200 sendtreemanifests=False,
1205 sendtreemanifests=False,
1201 bundlecaps=bundlecaps,
1206 bundlecaps=bundlecaps,
1202 shallow=shallow)
1207 shallow=shallow,
1208 ellipsisroots=ellipsisroots)
1203
1209
1204 def _makecg2packer(repo, filematcher, bundlecaps, shallow=False):
1210 def _makecg2packer(repo, filematcher, bundlecaps, shallow=False,
1211 ellipsisroots=None):
1205 builddeltaheader = lambda d: _CHANGEGROUPV2_DELTA_HEADER.pack(
1212 builddeltaheader = lambda d: _CHANGEGROUPV2_DELTA_HEADER.pack(
1206 d.node, d.p1node, d.p2node, d.basenode, d.linknode)
1213 d.node, d.p1node, d.p2node, d.basenode, d.linknode)
1207
1214
1208 # Since generaldelta is directly supported by cg2, reordering
1215 # Since generaldelta is directly supported by cg2, reordering
1209 # generally doesn't help, so we disable it by default (treating
1216 # generally doesn't help, so we disable it by default (treating
1210 # bundle.reorder=auto just like bundle.reorder=False).
1217 # bundle.reorder=auto just like bundle.reorder=False).
1211 return cgpacker(repo, filematcher, b'02',
1218 return cgpacker(repo, filematcher, b'02',
1212 useprevdelta=False,
1219 useprevdelta=False,
1213 allowreorder=False,
1220 allowreorder=False,
1214 builddeltaheader=builddeltaheader,
1221 builddeltaheader=builddeltaheader,
1215 manifestsend=b'',
1222 manifestsend=b'',
1216 sendtreemanifests=False,
1223 sendtreemanifests=False,
1217 bundlecaps=bundlecaps,
1224 bundlecaps=bundlecaps,
1218 shallow=shallow)
1225 shallow=shallow,
1226 ellipsisroots=ellipsisroots)
1219
1227
1220 def _makecg3packer(repo, filematcher, bundlecaps, shallow=False):
1228 def _makecg3packer(repo, filematcher, bundlecaps, shallow=False,
1229 ellipsisroots=None):
1221 builddeltaheader = lambda d: _CHANGEGROUPV3_DELTA_HEADER.pack(
1230 builddeltaheader = lambda d: _CHANGEGROUPV3_DELTA_HEADER.pack(
1222 d.node, d.p1node, d.p2node, d.basenode, d.linknode, d.flags)
1231 d.node, d.p1node, d.p2node, d.basenode, d.linknode, d.flags)
1223
1232
1224 return cgpacker(repo, filematcher, b'03',
1233 return cgpacker(repo, filematcher, b'03',
1225 useprevdelta=False,
1234 useprevdelta=False,
1226 allowreorder=False,
1235 allowreorder=False,
1227 builddeltaheader=builddeltaheader,
1236 builddeltaheader=builddeltaheader,
1228 manifestsend=closechunk(),
1237 manifestsend=closechunk(),
1229 sendtreemanifests=True,
1238 sendtreemanifests=True,
1230 bundlecaps=bundlecaps,
1239 bundlecaps=bundlecaps,
1231 shallow=shallow)
1240 shallow=shallow,
1241 ellipsisroots=ellipsisroots)
1232
1242
1233 _packermap = {'01': (_makecg1packer, cg1unpacker),
1243 _packermap = {'01': (_makecg1packer, cg1unpacker),
1234 # cg2 adds support for exchanging generaldelta
1244 # cg2 adds support for exchanging generaldelta
1235 '02': (_makecg2packer, cg2unpacker),
1245 '02': (_makecg2packer, cg2unpacker),
1236 # cg3 adds support for exchanging revlog flags and treemanifests
1246 # cg3 adds support for exchanging revlog flags and treemanifests
1237 '03': (_makecg3packer, cg3unpacker),
1247 '03': (_makecg3packer, cg3unpacker),
1238 }
1248 }
1239
1249
1240 def allsupportedversions(repo):
1250 def allsupportedversions(repo):
1241 versions = set(_packermap.keys())
1251 versions = set(_packermap.keys())
1242 if not (repo.ui.configbool('experimental', 'changegroup3') or
1252 if not (repo.ui.configbool('experimental', 'changegroup3') or
1243 repo.ui.configbool('experimental', 'treemanifest') or
1253 repo.ui.configbool('experimental', 'treemanifest') or
1244 'treemanifest' in repo.requirements):
1254 'treemanifest' in repo.requirements):
1245 versions.discard('03')
1255 versions.discard('03')
1246 return versions
1256 return versions
1247
1257
1248 # Changegroup versions that can be applied to the repo
1258 # Changegroup versions that can be applied to the repo
1249 def supportedincomingversions(repo):
1259 def supportedincomingversions(repo):
1250 return allsupportedversions(repo)
1260 return allsupportedversions(repo)
1251
1261
1252 # Changegroup versions that can be created from the repo
1262 # Changegroup versions that can be created from the repo
1253 def supportedoutgoingversions(repo):
1263 def supportedoutgoingversions(repo):
1254 versions = allsupportedversions(repo)
1264 versions = allsupportedversions(repo)
1255 if 'treemanifest' in repo.requirements:
1265 if 'treemanifest' in repo.requirements:
1256 # Versions 01 and 02 support only flat manifests and it's just too
1266 # Versions 01 and 02 support only flat manifests and it's just too
1257 # expensive to convert between the flat manifest and tree manifest on
1267 # expensive to convert between the flat manifest and tree manifest on
1258 # the fly. Since tree manifests are hashed differently, all of history
1268 # the fly. Since tree manifests are hashed differently, all of history
1259 # would have to be converted. Instead, we simply don't even pretend to
1269 # would have to be converted. Instead, we simply don't even pretend to
1260 # support versions 01 and 02.
1270 # support versions 01 and 02.
1261 versions.discard('01')
1271 versions.discard('01')
1262 versions.discard('02')
1272 versions.discard('02')
1263 if repository.NARROW_REQUIREMENT in repo.requirements:
1273 if repository.NARROW_REQUIREMENT in repo.requirements:
1264 # Versions 01 and 02 don't support revlog flags, and we need to
1274 # Versions 01 and 02 don't support revlog flags, and we need to
1265 # support that for stripping and unbundling to work.
1275 # support that for stripping and unbundling to work.
1266 versions.discard('01')
1276 versions.discard('01')
1267 versions.discard('02')
1277 versions.discard('02')
1268 if LFS_REQUIREMENT in repo.requirements:
1278 if LFS_REQUIREMENT in repo.requirements:
1269 # Versions 01 and 02 don't support revlog flags, and we need to
1279 # Versions 01 and 02 don't support revlog flags, and we need to
1270 # mark LFS entries with REVIDX_EXTSTORED.
1280 # mark LFS entries with REVIDX_EXTSTORED.
1271 versions.discard('01')
1281 versions.discard('01')
1272 versions.discard('02')
1282 versions.discard('02')
1273
1283
1274 return versions
1284 return versions
1275
1285
1276 def localversion(repo):
1286 def localversion(repo):
1277 # Finds the best version to use for bundles that are meant to be used
1287 # Finds the best version to use for bundles that are meant to be used
1278 # locally, such as those from strip and shelve, and temporary bundles.
1288 # locally, such as those from strip and shelve, and temporary bundles.
1279 return max(supportedoutgoingversions(repo))
1289 return max(supportedoutgoingversions(repo))
1280
1290
1281 def safeversion(repo):
1291 def safeversion(repo):
1282 # Finds the smallest version that it's safe to assume clients of the repo
1292 # Finds the smallest version that it's safe to assume clients of the repo
1283 # will support. For example, all hg versions that support generaldelta also
1293 # will support. For example, all hg versions that support generaldelta also
1284 # support changegroup 02.
1294 # support changegroup 02.
1285 versions = supportedoutgoingversions(repo)
1295 versions = supportedoutgoingversions(repo)
1286 if 'generaldelta' in repo.requirements:
1296 if 'generaldelta' in repo.requirements:
1287 versions.discard('01')
1297 versions.discard('01')
1288 assert versions
1298 assert versions
1289 return min(versions)
1299 return min(versions)
1290
1300
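To see the narrowing above in action, here is a stub-based sketch of how a repository requirement removes changegroup versions from the candidate set; the stub repo and helper are illustrative, not real Mercurial objects:

# Stub-based sketch of requirement-driven version narrowing.
class stubrepo(object):
    requirements = {'generaldelta', 'treemanifest'}

def outgoingversions(repo):
    versions = {'01', '02', '03'}
    if 'treemanifest' in repo.requirements:
        versions.discard('01')
        versions.discard('02')
    return versions

assert outgoingversions(stubrepo()) == {'03'}
assert min({'02', '03'}) == '02'   # safeversion picks the smallest left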
1291 def getbundler(version, repo, bundlecaps=None, filematcher=None,
1301 def getbundler(version, repo, bundlecaps=None, filematcher=None,
1292 shallow=False):
1302 shallow=False, ellipsisroots=None):
1293 assert version in supportedoutgoingversions(repo)
1303 assert version in supportedoutgoingversions(repo)
1294
1304
1295 if filematcher is None:
1305 if filematcher is None:
1296 filematcher = matchmod.alwaysmatcher(repo.root, '')
1306 filematcher = matchmod.alwaysmatcher(repo.root, '')
1297
1307
1298 if version == '01' and not filematcher.always():
1308 if version == '01' and not filematcher.always():
1299 raise error.ProgrammingError('version 01 changegroups do not support '
1309 raise error.ProgrammingError('version 01 changegroups do not support '
1300 'sparse file matchers')
1310 'sparse file matchers')
1301
1311
1302 # Requested files could include files not in the local store. So
1312 # Requested files could include files not in the local store. So
1303 # filter those out.
1313 # filter those out.
1304 filematcher = matchmod.intersectmatchers(repo.narrowmatch(),
1314 filematcher = matchmod.intersectmatchers(repo.narrowmatch(),
1305 filematcher)
1315 filematcher)
1306
1316
1307 fn = _packermap[version][0]
1317 fn = _packermap[version][0]
1308 return fn(repo, filematcher, bundlecaps, shallow=shallow)
1318 return fn(repo, filematcher, bundlecaps, shallow=shallow,
1319 ellipsisroots=ellipsisroots)
1309
1320
1310 def getunbundler(version, fh, alg, extras=None):
1321 def getunbundler(version, fh, alg, extras=None):
1311 return _packermap[version][1](fh, alg, extras=extras)
1322 return _packermap[version][1](fh, alg, extras=extras)
1312
1323
1313 def _changegroupinfo(repo, nodes, source):
1324 def _changegroupinfo(repo, nodes, source):
1314 if repo.ui.verbose or source == 'bundle':
1325 if repo.ui.verbose or source == 'bundle':
1315 repo.ui.status(_("%d changesets found\n") % len(nodes))
1326 repo.ui.status(_("%d changesets found\n") % len(nodes))
1316 if repo.ui.debugflag:
1327 if repo.ui.debugflag:
1317 repo.ui.debug("list of changesets:\n")
1328 repo.ui.debug("list of changesets:\n")
1318 for node in nodes:
1329 for node in nodes:
1319 repo.ui.debug("%s\n" % hex(node))
1330 repo.ui.debug("%s\n" % hex(node))
1320
1331
1321 def makechangegroup(repo, outgoing, version, source, fastpath=False,
1332 def makechangegroup(repo, outgoing, version, source, fastpath=False,
1322 bundlecaps=None):
1333 bundlecaps=None):
1323 cgstream = makestream(repo, outgoing, version, source,
1334 cgstream = makestream(repo, outgoing, version, source,
1324 fastpath=fastpath, bundlecaps=bundlecaps)
1335 fastpath=fastpath, bundlecaps=bundlecaps)
1325 return getunbundler(version, util.chunkbuffer(cgstream), None,
1336 return getunbundler(version, util.chunkbuffer(cgstream), None,
1326 {'clcount': len(outgoing.missing) })
1337 {'clcount': len(outgoing.missing) })
1327
1338
1328 def makestream(repo, outgoing, version, source, fastpath=False,
1339 def makestream(repo, outgoing, version, source, fastpath=False,
1329 bundlecaps=None, filematcher=None):
1340 bundlecaps=None, filematcher=None):
1330 bundler = getbundler(version, repo, bundlecaps=bundlecaps,
1341 bundler = getbundler(version, repo, bundlecaps=bundlecaps,
1331 filematcher=filematcher)
1342 filematcher=filematcher)
1332
1343
1333 repo = repo.unfiltered()
1344 repo = repo.unfiltered()
1334 commonrevs = outgoing.common
1345 commonrevs = outgoing.common
1335 csets = outgoing.missing
1346 csets = outgoing.missing
1336 heads = outgoing.missingheads
1347 heads = outgoing.missingheads
1337 # We go through the fast path if we get told to, or if all unfiltered
1348 # We go through the fast path if we get told to, or if all unfiltered
1338 # heads have been requested (since we then know all linkrevs will
1349 # heads have been requested (since we then know all linkrevs will
1339 # be pulled by the client).
1350 # be pulled by the client).
1340 heads.sort()
1351 heads.sort()
1341 fastpathlinkrev = fastpath or (
1352 fastpathlinkrev = fastpath or (
1342 repo.filtername is None and heads == sorted(repo.heads()))
1353 repo.filtername is None and heads == sorted(repo.heads()))
1343
1354
1344 repo.hook('preoutgoing', throw=True, source=source)
1355 repo.hook('preoutgoing', throw=True, source=source)
1345 _changegroupinfo(repo, csets, source)
1356 _changegroupinfo(repo, csets, source)
1346 return bundler.generate(commonrevs, csets, fastpathlinkrev, source)
1357 return bundler.generate(commonrevs, csets, fastpathlinkrev, source)
1347
1358
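A hedged usage sketch of the pipeline above: given a repo and an outgoing set obtained from a real Mercurial session, the chunks from makestream() can be written out directly. Only the wiring is illustrated here; bundle2 envelope handling is deliberately omitted, and the helper name is hypothetical:

# 'repo' and 'outgoing' are assumed to come from a real session.
def writeoutgoing(repo, outgoing, fh, source='bundle'):
    # makestream() yields raw changegroup chunks; concatenating them
    # gives the changegroup body that a bundle would carry.
    for chunk in makestream(repo, outgoing, '02', source):
        fh.write(chunk)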
1348 def _addchangegroupfiles(repo, source, revmap, trp, expectedfiles, needfiles):
1359 def _addchangegroupfiles(repo, source, revmap, trp, expectedfiles, needfiles):
1349 revisions = 0
1360 revisions = 0
1350 files = 0
1361 files = 0
1351 progress = repo.ui.makeprogress(_('files'), unit=_('files'),
1362 progress = repo.ui.makeprogress(_('files'), unit=_('files'),
1352 total=expectedfiles)
1363 total=expectedfiles)
1353 for chunkdata in iter(source.filelogheader, {}):
1364 for chunkdata in iter(source.filelogheader, {}):
1354 files += 1
1365 files += 1
1355 f = chunkdata["filename"]
1366 f = chunkdata["filename"]
1356 repo.ui.debug("adding %s revisions\n" % f)
1367 repo.ui.debug("adding %s revisions\n" % f)
1357 progress.increment()
1368 progress.increment()
1358 fl = repo.file(f)
1369 fl = repo.file(f)
1359 o = len(fl)
1370 o = len(fl)
1360 try:
1371 try:
1361 deltas = source.deltaiter()
1372 deltas = source.deltaiter()
1362 if not fl.addgroup(deltas, revmap, trp):
1373 if not fl.addgroup(deltas, revmap, trp):
1363 raise error.Abort(_("received file revlog group is empty"))
1374 raise error.Abort(_("received file revlog group is empty"))
1364 except error.CensoredBaseError as e:
1375 except error.CensoredBaseError as e:
1365 raise error.Abort(_("received delta base is censored: %s") % e)
1376 raise error.Abort(_("received delta base is censored: %s") % e)
1366 revisions += len(fl) - o
1377 revisions += len(fl) - o
1367 if f in needfiles:
1378 if f in needfiles:
1368 needs = needfiles[f]
1379 needs = needfiles[f]
1369 for new in pycompat.xrange(o, len(fl)):
1380 for new in pycompat.xrange(o, len(fl)):
1370 n = fl.node(new)
1381 n = fl.node(new)
1371 if n in needs:
1382 if n in needs:
1372 needs.remove(n)
1383 needs.remove(n)
1373 else:
1384 else:
1374 raise error.Abort(
1385 raise error.Abort(
1375 _("received spurious file revlog entry"))
1386 _("received spurious file revlog entry"))
1376 if not needs:
1387 if not needs:
1377 del needfiles[f]
1388 del needfiles[f]
1378 progress.complete()
1389 progress.complete()
1379
1390
1380 for f, needs in needfiles.iteritems():
1391 for f, needs in needfiles.iteritems():
1381 fl = repo.file(f)
1392 fl = repo.file(f)
1382 for n in needs:
1393 for n in needs:
1383 try:
1394 try:
1384 fl.rev(n)
1395 fl.rev(n)
1385 except error.LookupError:
1396 except error.LookupError:
1386 raise error.Abort(
1397 raise error.Abort(
1387 _('missing file data for %s:%s - run hg verify') %
1398 _('missing file data for %s:%s - run hg verify') %
1388 (f, hex(n)))
1399 (f, hex(n)))
1389
1400
1390 return revisions, files
1401 return revisions, files
1391
1402
1392 def _packellipsischangegroup(repo, common, match, relevant_nodes,
1403 def _packellipsischangegroup(repo, common, match, relevant_nodes,
1393 ellipsisroots, visitnodes, depth, source, version):
1404 ellipsisroots, visitnodes, depth, source, version):
1394 if version in ('01', '02'):
1405 if version in ('01', '02'):
1395 raise error.Abort(
1406 raise error.Abort(
1396 'ellipsis nodes require at least cg3 on client and server, '
1407 'ellipsis nodes require at least cg3 on client and server, '
1397 'but negotiated version %s' % version)
1408 'but negotiated version %s' % version)
1398 # We wrap cg1packer.revchunk, using a side channel to pass
1409 # We wrap cg1packer.revchunk, using a side channel to pass
1399 # relevant_nodes into that area. Then if linknode isn't in the
1410 # relevant_nodes into that area. Then if linknode isn't in the
1400 # set, we know we have an ellipsis node and we should defer
1411 # set, we know we have an ellipsis node and we should defer
1401 # sending that node's data. We override close() to detect
1412 # sending that node's data. We override close() to detect
1402 # pending ellipsis nodes and flush them.
1413 # pending ellipsis nodes and flush them.
1403 packer = getbundler(version, repo, filematcher=match,
1414 packer = getbundler(version, repo, filematcher=match,
1404 shallow=depth is not None)
1415 shallow=depth is not None,
1416 ellipsisroots=ellipsisroots)
1405 # Give the packer the list of nodes which should not be
1417 # Give the packer the list of nodes which should not be
1406 # ellipsis nodes. We store this rather than the set of nodes
1418 # ellipsis nodes. We store this rather than the set of nodes
1407 # that should be an ellipsis because for very large histories
1419 # that should be an ellipsis because for very large histories
1408 # we expect this to be significantly smaller.
1420 # we expect this to be significantly smaller.
1409 packer._full_nodes = relevant_nodes
1421 packer._full_nodes = relevant_nodes
1410 # Maps ellipsis revs to their roots at the changelog level.
1411 packer._precomputed_ellipsis = ellipsisroots
1412
1422
1413 return packer.generate(common, visitnodes, False, source)
1423 return packer.generate(common, visitnodes, False, source)