upstream/mercurial-mirror Commit - r39018:037debbf

1

# changegroup.py - Mercurial changegroup manipulation functions

1

# changegroup.py - Mercurial changegroup manipulation functions

2

#

2

#

3

4

#

4

#

5

# This software may be used and distributed according to the terms of the

5

# This software may be used and distributed according to the terms of the

6

# GNU General Public License version 2 or any later version.

6

# GNU General Public License version 2 or any later version.

7

8

from __future__ import absolute_import

8

from __future__ import absolute_import

9

10

import os

10

import os

11

import struct

11

import struct

12

import weakref

12

import weakref

13

14

from .i18n import _

14

from .i18n import _

15

from .node import (

15

from .node import (

16

hex,

16

hex,

17

nullid,

17

nullid,

18

nullrev,

18

nullrev,

19

short,

19

short,

20

)

20

)

21

22

from .thirdparty import (

22

from .thirdparty import (

23

attr,

23

attr,

24

)

24

)

25

26

from . import (

26

from . import (

27

dagutil,

27

dagutil,

28

error,

28

error,

29

manifest,

29

manifest,

30

match as matchmod,

30

match as matchmod,

31

mdiff,

31

mdiff,

32

phases,

32

phases,

33

pycompat,

33

pycompat,

34

repository,

34

repository,

35

revlog,

35

revlog,

36

util,

36

util,

37

)

37

)

38

39

from .utils import (

39

from .utils import (

40

stringutil,

40

stringutil,

41

)

41

)

42

43

# Binary layouts of the per-delta header for each changegroup version.
# Every "20s" field is a 20-byte string; the unpackers below name the
# fields (node, p1, p2, [deltabase,] cs[, flags]).
_CHANGEGROUPV1_DELTA_HEADER = struct.Struct("20s20s20s20s")
_CHANGEGROUPV2_DELTA_HEADER = struct.Struct("20s20s20s20s20s")
# Version 3 appends a big-endian unsigned 16-bit flags field.
_CHANGEGROUPV3_DELTA_HEADER = struct.Struct(">20s20s20s20s20sH")

LFS_REQUIREMENT = 'lfs'

# Module-level alias so the readers below can call readexactly() directly.
readexactly = util.readexactly

50

51

def getchunk(stream):
    """Return the next chunk from stream as a string.

    A chunk is framed by a 4-byte big-endian signed length that includes
    the length field itself. A length of 0 denotes an empty chunk, for
    which "" is returned; any other length of 4 or less cannot describe a
    payload and is rejected.

    Raises error.Abort when the encoded length is invalid.
    """
    d = readexactly(stream, 4)
    l = struct.unpack(">l", d)[0]
    if l <= 4:
        if l:
            raise error.Abort(_("invalid chunk length %d") % l)
        return ""
    # The length counts its own 4 bytes, so the payload is l - 4 bytes.
    return readexactly(stream, l - 4)

60

61

def chunkheader(length):
    """Return a changegroup chunk header (string) for a payload of *length*.

    The header is a 4-byte big-endian signed integer holding the payload
    length plus the 4 bytes of the header itself.
    """
    return struct.pack(">l", length + 4)

64

65

def closechunk():
    """Return a changegroup chunk header (string) for a zero-length chunk.

    The result is four zero bytes: a big-endian signed length of 0.
    """
    return struct.pack(">l", 0)

68

69

def _fileheader(path):
    """Obtain a changegroup chunk header for a named path.

    Returns the chunk header for len(path) immediately followed by the
    path itself, i.e. a complete chunk whose payload is the path.
    """
    return chunkheader(len(path)) + path

72

73

def writechunks(ui, chunks, filename, vfs=None):
    """Write chunks to a file and return its filename.

    The stream is assumed to be a bundle file.
    If no filename is specified, a temporary file is created.

    ``chunks`` is an iterable of strings written in order. When ``vfs`` is
    given (and a filename is specified) the file is opened through it,
    otherwise the builtin ``open`` is used. ``ui`` is not used here.

    If writing fails, the partially written file is removed before the
    exception propagates.

    NOTE(review): this docstring used to state that existing files are not
    overwritten, but the plain ``open(filename, "wb")`` path truncates an
    existing file; whether ``vfs.open`` behaves differently cannot be told
    from this function.
    """
    fh = None
    cleanup = None
    try:
        if filename:
            if vfs:
                fh = vfs.open(filename, "wb")
            else:
                # Increase default buffer size because default is usually
                # small (4k is common on Linux).
                fh = open(filename, "wb", 131072)
        else:
            fd, filename = pycompat.mkstemp(prefix="hg-bundle-", suffix=".hg")
            fh = os.fdopen(fd, r"wb")
        # From here on a failure must remove the file we created/opened.
        cleanup = filename
        for c in chunks:
            fh.write(c)
        # Everything was written: disarm the cleanup in ``finally``.
        cleanup = None
        return filename
    finally:
        if fh is not None:
            fh.close()
        if cleanup is not None:
            if filename and vfs:
                vfs.unlink(cleanup)
            else:
                os.unlink(cleanup)

106

107

class cg1unpacker(object):
    """Unpacker for cg1 changegroup streams.

    A changegroup unpacker handles the framing of the revision data in
    the wire format. Most consumers will want to use the apply()
    method to add the changes from the changegroup to a repository.

    If you're forwarding a changegroup unmodified to another consumer,
    use getchunks(), which returns an iterator of changegroup
    chunks. This is mostly useful for cases where you need to know the
    data stream has ended by observing the end of the changegroup.

    deltachunk() is useful only if you're applying delta data. Most
    consumers should prefer apply() instead.

    A few other public methods exist. Those are used only for
    bundlerepo and some debug commands - their use is discouraged.
    """
    deltaheader = _CHANGEGROUPV1_DELTA_HEADER
    deltaheadersize = deltaheader.size
    version = '01'
    _grouplistcount = 1 # One list of files after the manifests

    def __init__(self, fh, alg, extras=None):
        """Wrap file object ``fh`` in a decompressing reader.

        ``alg`` is the bundle compression type; None is treated as 'UN'.
        An unsupported type raises error.Abort. ``extras`` is stored as a
        dict on the instance (empty when not provided).
        """
        if alg is None:
            alg = 'UN'
        if alg not in util.compengines.supportedbundletypes:
            raise error.Abort(_('unknown stream compression type: %s')
                              % alg)
        # 'BZ' is looked up under the '_truncatedBZ' bundle type name.
        if alg == 'BZ':
            alg = '_truncatedBZ'

        compengine = util.compengines.forbundletype(alg)
        self._stream = compengine.decompressorreader(fh)
        self._type = alg
        self.extras = extras or {}
        # Optional zero-argument callable invoked by _chunklength() for
        # every non-empty chunk (used for progress reporting).
        self.callback = None

    # These methods (compressed, read, seek, tell) all appear to only
    # be used by bundlerepo, but it's a little hard to tell.
    def compressed(self):
        """Return True unless the stream type is unset or 'UN'."""
        return self._type is not None and self._type != 'UN'

    def read(self, l):
        """Read ``l`` bytes from the underlying (decompressed) stream."""
        return self._stream.read(l)

    def seek(self, pos):
        """Delegate seek() to the underlying stream."""
        return self._stream.seek(pos)

    def tell(self):
        """Delegate tell() to the underlying stream."""
        return self._stream.tell()

    def close(self):
        """Close the underlying stream."""
        return self._stream.close()

    def _chunklength(self):
        """Read a chunk header and return the payload length.

        Returns 0 for an empty chunk. Raises error.Abort for any other
        encoded length of 4 or less. For non-empty chunks the progress
        callback, if set, is invoked once.
        """
        d = readexactly(self._stream, 4)
        l = struct.unpack(">l", d)[0]
        if l <= 4:
            if l:
                raise error.Abort(_("invalid chunk length %d") % l)
            return 0
        if self.callback:
            self.callback()
        # The encoded length includes the 4 header bytes.
        return l - 4

    def changelogheader(self):
        """v10 does not have a changelog header chunk"""
        return {}

    def manifestheader(self):
        """v10 does not have a manifest header chunk"""
        return {}

    def filelogheader(self):
        """return the header of the filelogs chunk, v10 only has the filename

        Returns {} when the next chunk is empty, otherwise a dict with a
        single 'filename' key.
        """
        l = self._chunklength()
        if not l:
            return {}
        fname = readexactly(self._stream, l)
        return {'filename': fname}

    def _deltaheader(self, headertuple, prevnode):
        """Normalize an unpacked v1 delta header.

        v1 headers carry no explicit delta base: the base is p1 for the
        first delta of a group (``prevnode`` is None) and the previous
        node otherwise. Flags are always 0.

        Returns (node, p1, p2, deltabase, cs, flags).
        """
        node, p1, p2, cs = headertuple
        if prevnode is None:
            deltabase = p1
        else:
            deltabase = prevnode
        flags = 0
        return node, p1, p2, deltabase, cs, flags

    def deltachunk(self, prevnode):
        """Read the next delta chunk from the stream.

        Returns {} at the end of the current group (empty chunk),
        otherwise the tuple (node, p1, p2, cs, deltabase, delta, flags).
        """
        l = self._chunklength()
        if not l:
            return {}
        headerdata = readexactly(self._stream, self.deltaheadersize)
        header = self.deltaheader.unpack(headerdata)
        # The rest of the chunk after the fixed-size header is the delta.
        delta = readexactly(self._stream, l - self.deltaheadersize)
        node, p1, p2, deltabase, cs, flags = self._deltaheader(header, prevnode)
        return (node, p1, p2, cs, deltabase, delta, flags)

    def getchunks(self):
        """Yield all the chunks contained in the bundle.

        Used when you need to forward the binary stream to a file or another
        network API. To do so, it parses the changegroup data, otherwise it
        would block in case of sshrepo because it doesn't know the end of the
        stream.
        """
        # For changegroup 1 and 2, we expect 3 parts: changelog, manifestlog,
        # and a list of filelogs. For changegroup 3, we expect 4 parts:
        # changelog, manifestlog, a list of tree manifestlogs, and a list of
        # filelogs.
        #
        # Changelog and manifestlog parts are terminated with empty chunks. The
        # tree and file parts are a list of entry sections. Each entry section
        # is a series of chunks terminating in an empty chunk. The list of these
        # entry sections is terminated in yet another empty chunk, so we know
        # we've reached the end of the tree/file list when we reach an empty
        # chunk that was preceded by no non-empty chunks.

        parts = 0
        while parts < 2 + self._grouplistcount:
            noentries = True
            while True:
                chunk = getchunk(self)
                if not chunk:
                    # The first two empty chunks represent the end of the
                    # changelog and the manifestlog portions. The remaining
                    # empty chunks represent either A) the end of individual
                    # tree or file entries in the file list, or B) the end of
                    # the entire list. It's the end of the entire list if there
                    # were no entries (i.e. noentries is True).
                    if parts < 2:
                        parts += 1
                    elif noentries:
                        parts += 1
                    break
                noentries = False
                yield chunkheader(len(chunk))
                # Re-emit the payload in slices of at most 2**20 bytes.
                pos = 0
                while pos < len(chunk):
                    end = pos + 2**20
                    yield chunk[pos:end]
                    pos = end
            yield closechunk()

    def _unpackmanifests(self, repo, revmap, trp, prog):
        """Add the manifest group of the stream to ``repo.manifestlog``.

        ``prog`` is a progress object: its increment() is installed as the
        chunk callback while the group is read and complete() is called
        afterwards.
        """
        self.callback = prog.increment
        # no need to check for empty manifest group here:
        # if the result of the merge of 1 and 2 is the same in 3 and 4,
        # no new manifest will be created and the manifest group will
        # be empty during the pull
        self.manifestheader()
        deltas = self.deltaiter()
        repo.manifestlog.addgroup(deltas, revmap, trp)
        prog.complete()
        self.callback = None

    def apply(self, repo, tr, srctype, url, targetphase=phases.draft,
              expectedtotal=None):
        """Add the changegroup returned by source.read() to this repo.
        srctype is a string like 'push', 'pull', or 'unbundle'.  url is
        the URL of the repo where this changegroup is coming from.

        Return an integer summarizing the change to this repo:
        - nothing changed or no source: 0
        - more heads than before: 1+added heads (2..n)
        - fewer heads than before: -1-removed heads (-2..-n)
        - number of heads stays the same: 1
        """
        repo = repo.unfiltered()

        # Both helpers close over ``cl``, which is bound inside the try
        # block below before either of them is called.
        def csmap(x):
            repo.ui.debug("add changeset %s\n" % short(x))
            return len(cl)

        def revmap(x):
            return cl.rev(x)

        changesets = files = revisions = 0

        try:
            # The transaction may already carry source information. In this
            # case we use the top level data. We overwrite the argument
            # because we need to use the top level value (if they exist)
            # in this function.
            srctype = tr.hookargs.setdefault('source', srctype)
            url = tr.hookargs.setdefault('url', url)
            repo.hook('prechangegroup',
                      throw=True, **pycompat.strkwargs(tr.hookargs))

            # write changelog data to temp files so concurrent readers
            # will not see an inconsistent view
            cl = repo.changelog
            cl.delayupdate(tr)
            oldheads = set(cl.heads())

            trp = weakref.proxy(tr)
            # pull off the changeset group
            repo.ui.status(_("adding changesets\n"))
            clstart = len(cl)
            progress = repo.ui.makeprogress(_('changesets'), unit=_('chunks'),
                                            total=expectedtotal)
            self.callback = progress.increment

            # Collect the files touched by the incoming changesets; only
            # the count is kept once the changelog group is processed.
            efiles = set()
            def onchangelog(cl, node):
                efiles.update(cl.readfiles(node))

            self.changelogheader()
            deltas = self.deltaiter()
            cgnodes = cl.addgroup(deltas, csmap, trp, addrevisioncb=onchangelog)
            efiles = len(efiles)

            if not cgnodes:
                repo.ui.develwarn('applied empty changegroup',
                                  config='warn-empty-changegroup')
            clend = len(cl)
            changesets = clend - clstart
            progress.complete()
            self.callback = None

            # pull off the manifest group
            repo.ui.status(_("adding manifests\n"))
            # We know that we'll never have more manifests than we had
            # changesets.
            progress = repo.ui.makeprogress(_('manifests'), unit=_('chunks'),
                                            total=changesets)
            self._unpackmanifests(repo, revmap, trp, progress)

            needfiles = {}
            if repo.ui.configbool('server', 'validate'):
                cl = repo.changelog
                ml = repo.manifestlog
                # validate incoming csets have their manifests
                for cset in pycompat.xrange(clstart, clend):
                    mfnode = cl.changelogrevision(cset).manifest
                    mfest = ml[mfnode].readdelta()
                    # store file cgnodes we must see
                    for f, n in mfest.iteritems():
                        needfiles.setdefault(f, set()).add(n)

            # process the files
            repo.ui.status(_("adding file changes\n"))
            newrevs, newfiles = _addchangegroupfiles(
                repo, self, revmap, trp, efiles, needfiles)
            revisions += newrevs
            files += newfiles

            deltaheads = 0
            if oldheads:
                heads = cl.heads()
                deltaheads = len(heads) - len(oldheads)
                # New heads that close a branch do not count as added.
                for h in heads:
                    if h not in oldheads and repo[h].closesbranch():
                        deltaheads -= 1
            htext = ""
            if deltaheads:
                htext = _(" (%+d heads)") % deltaheads

            repo.ui.status(_("added %d changesets"
                             " with %d changes to %d files%s\n")
                           % (changesets, revisions, files, htext))
            repo.invalidatevolatilesets()

            if changesets > 0:
                if 'node' not in tr.hookargs:
                    tr.hookargs['node'] = hex(cl.node(clstart))
                    tr.hookargs['node_last'] = hex(cl.node(clend - 1))
                    hookargs = dict(tr.hookargs)
                else:
                    # The transaction already has a 'node': keep it and
                    # only set our range on the local copy.
                    hookargs = dict(tr.hookargs)
                    hookargs['node'] = hex(cl.node(clstart))
                    hookargs['node_last'] = hex(cl.node(clend - 1))
                repo.hook('pretxnchangegroup',
                          throw=True, **pycompat.strkwargs(hookargs))

            added = [cl.node(r) for r in pycompat.xrange(clstart, clend)]
            phaseall = None
            if srctype in ('push', 'serve'):
                # Old servers can not push the boundary themselves.
                # New servers won't push the boundary if changeset already
                # exists locally as secret
                #
                # We should not use added here but the list of all change in
                # the bundle
                if repo.publishing():
                    targetphase = phaseall = phases.public
                else:
                    # closer target phase computation

                    # Those changesets have been pushed from the
                    # outside, their phases are going to be pushed
                    # alongside. Therefore `targetphase` is
                    # ignored.
                    targetphase = phaseall = phases.draft
            if added:
                phases.registernew(repo, tr, targetphase, added)
            if phaseall is not None:
                phases.advanceboundary(repo, tr, phaseall, cgnodes)

            if changesets > 0:

                def runhooks():
                    # These hooks run when the lock releases, not when the
                    # transaction closes. So it's possible for the changelog
                    # to have changed since we last saw it.
                    if clstart >= len(repo):
                        return

                    repo.hook("changegroup", **pycompat.strkwargs(hookargs))

                    for n in added:
                        args = hookargs.copy()
                        args['node'] = hex(n)
                        del args['node_last']
                        repo.hook("incoming", **pycompat.strkwargs(args))

                    newheads = [h for h in repo.heads()
                                if h not in oldheads]
                    repo.ui.log("incoming",
                                "%d incoming changes - new heads: %s\n",
                                len(added),
                                ', '.join([hex(c[:6]) for c in newheads]))

                tr.addpostclose('changegroup-runhooks-%020i' % clstart,
                                lambda tr: repo._afterlock(runhooks))
        finally:
            repo.ui.flush()
        # never return 0 here:
        if deltaheads < 0:
            ret = deltaheads - 1
        else:
            ret = deltaheads + 1
        return ret

    def deltaiter(self):
        """
        returns an iterator of the deltas in this changegroup

        Useful for passing to the underlying storage system to be stored.
        """
        chain = None
        # deltachunk() returns {} at the end of the group, which is the
        # sentinel that stops this two-argument iter().
        for chunkdata in iter(lambda: self.deltachunk(chain), {}):
            # Chunkdata: (node, p1, p2, cs, deltabase, delta, flags)
            yield chunkdata
            # The node just yielded becomes ``prevnode`` for the next chunk.
            chain = chunkdata[0]

449

450

class cg2unpacker(cg1unpacker):
    """Unpacker for cg2 streams.

    cg2 streams add support for generaldelta, so the delta header
    format is slightly different. All other features about the data
    remain the same.
    """
    deltaheader = _CHANGEGROUPV2_DELTA_HEADER
    deltaheadersize = deltaheader.size
    version = '02'

    def _deltaheader(self, headertuple, prevnode):
        """Normalize an unpacked v2 delta header.

        The delta base is carried explicitly in the header, so
        ``prevnode`` is not consulted. Flags are always 0.

        Returns (node, p1, p2, deltabase, cs, flags).
        """
        node, p1, p2, deltabase, cs = headertuple
        flags = 0
        return node, p1, p2, deltabase, cs, flags

465

466

class cg3unpacker(cg2unpacker):
    """Unpacker for cg3 streams.

    cg3 streams add support for exchanging treemanifests and revlog
    flags. It adds the revlog flags to the delta header and an empty chunk
    separating manifests and files.
    """
    deltaheader = _CHANGEGROUPV3_DELTA_HEADER
    deltaheadersize = deltaheader.size
    version = '03'
    _grouplistcount = 2 # One list of manifests and one list of files

    def _deltaheader(self, headertuple, prevnode):
        """Normalize an unpacked v3 delta header.

        The header already has the normalized field order, including the
        flags, so it is returned as-is; ``prevnode`` is not consulted.

        Returns (node, p1, p2, deltabase, cs, flags).
        """
        node, p1, p2, deltabase, cs, flags = headertuple
        return node, p1, p2, deltabase, cs, flags

    def _unpackmanifests(self, repo, revmap, trp, prog):
        """Add the root manifest group, then any directory manifest groups.

        Raises error.Abort if a directory group contains no revisions.
        """
        super(cg3unpacker, self)._unpackmanifests(repo, revmap, trp, prog)
        # filelogheader() returns {} on an empty chunk, which is the
        # sentinel that ends the list of directory entries.
        for chunkdata in iter(self.filelogheader, {}):
            # If we get here, there are directory manifests in the changegroup
            d = chunkdata["filename"]
            repo.ui.debug("adding %s revisions\n" % d)
            dirlog = repo.manifestlog._revlog.dirlog(d)
            deltas = self.deltaiter()
            if not dirlog.addgroup(deltas, revmap, trp):
                raise error.Abort(_("received dir revlog group is empty"))

492

493

class headerlessfixup(object):
    """File-like reader that serves buffered bytes ``h`` before ``fh``.

    ``read(n)`` first drains the in-memory prefix ``h``; once that is
    exhausted every read goes straight to ``fh`` through ``readexactly``.
    """

    def __init__(self, fh, h):
        # Bytes still to be replayed ahead of the underlying stream.
        self._h = h
        self._fh = fh

    def read(self, n):
        """Return ``n`` bytes, taking from the buffered prefix first."""
        if self._h:
            d, self._h = self._h[:n], self._h[n:]
            if len(d) < n:
                # The prefix ran out mid-read: top up from the real stream.
                d += readexactly(self._fh, n - len(d))
            return d
        return readexactly(self._fh, n)

504

505

@attr.s(slots=True, frozen=True)
class revisiondelta(object):
    """Describes a delta entry in a changegroup.

    Captured data is sufficient to serialize the delta into multiple
    formats.
    """
    # 20 byte node of this revision.
    node = attr.ib()
    # 20 byte nodes of parent revisions.
    p1node = attr.ib()
    p2node = attr.ib()
    # 20 byte node of node this delta is against.
    basenode = attr.ib()
    # 20 byte node of changeset revision this delta is associated with.
    linknode = attr.ib()
    # 2 bytes of flags to apply to revision data.
    flags = attr.ib()
    # Iterable of chunks holding raw delta data.
    deltachunks = attr.ib()

525

526

def _sortnodesnormal(store, nodes, reorder):

527

"""Sort nodes for changegroup generation and turn into revnums."""

528

# for generaldelta revlogs, we linearize the revs; this will both be

529

# much quicker and generate a much smaller bundle

530

if (store._generaldelta and reorder is None) or reorder:

531

dag = dagutil.revlogdag(store)

532

return dag.linearize(set(store.rev(n) for n in nodes))

533

else:

534

return sorted([store.rev(n) for n in nodes])

535

536

def _sortnodesellipsis(store, nodes, clnodetorev, lookup):

537

"""Sort nodes for changegroup generation and turn into revnums."""

538

# Ellipses serving mode.

539

#

540

# In a perfect world, we'd generate better ellipsis-ified graphs

541

# for non-changelog revlogs. In practice, we haven't started doing

542

# that yet, so the resulting DAGs for the manifestlog and filelogs

543

# are actually full of bogus parentage on all the ellipsis

544

# nodes. This has the side effect that, while the contents are

545

# correct, the individual DAGs might be completely out of whack in

546

# a case like 882681bc3166 and its ancestors (back about 10

547

# revisions or so) in the main hg repo.

548

#

549

# The one invariant we *know* holds is that the new (potentially

550

# bogus) DAG shape will be valid if we order the nodes in the

551

# order that they're introduced in dramatis personae by the

552

# changelog, so what we do is we sort the non-changelog histories

553

# by the order in which they are used by the changelog.

554

key = lambda n: clnodetorev[lookup(n)]

555

return [store.rev(n) for n in sorted(nodes, key=key)]

556

526

class cgpacker(object):

557

class cgpacker(object):

527

def __init__(self, repo, filematcher, version, allowreorder,
             deltaparentfn, builddeltaheader, manifestsend,
             bundlecaps=None, ellipses=False,
             shallow=False, ellipsisroots=None, fullnodes=None):
    """Given a source repo, construct a bundler.

    filematcher is a matcher that matches on files to include in the
    changegroup. Used to facilitate sparse changegroups.

    allowreorder controls whether reordering of revisions is allowed.
    This value is used when ``bundle.reorder`` is ``auto`` or isn't
    set.

    deltaparentfn is a callable that resolves the delta parent for
    a specific revision.

    builddeltaheader is a callable that constructs the header for a group
    delta.

    manifestsend is a chunk to send after manifests have been fully emitted.

    ellipses indicates whether ellipsis serving mode is enabled.

    bundlecaps is optional and can be used to specify the set of
    capabilities which can be used to build the bundle. While bundlecaps is
    unused in core Mercurial, extensions rely on this feature to communicate
    capabilities to customize the changegroup packer.

    shallow indicates whether shallow data might be sent. The packer may
    need to pack file contents not introduced by the changes being packed.

    fullnodes is the list of nodes which should not be ellipsis nodes. We
    store this rather than the set of nodes that should be ellipsis because
    for very large histories we expect this to be significantly smaller.
    """
    assert filematcher
    self._filematcher = filematcher

    self.version = version
    self._deltaparentfn = deltaparentfn
    self._builddeltaheader = builddeltaheader
    self._manifestsend = manifestsend
    self._ellipses = ellipses

    # Set of capabilities we can use to build the bundle.
    if bundlecaps is None:
        bundlecaps = set()
    self._bundlecaps = bundlecaps
    self._isshallow = shallow
    self._fullnodes = fullnodes

    # Maps ellipsis revs to their roots at the changelog level.
    self._precomputedellipsis = ellipsisroots

    # experimental config: bundle.reorder
    reorder = repo.ui.config('bundle', 'reorder')
    if reorder == 'auto':
        self._reorder = allowreorder
    else:
        self._reorder = stringutil.parsebool(reorder)

    self._repo = repo

    # Size notes are emitted only in verbose mode without the debug flag.
    if self._repo.ui.verbose and not self._repo.ui.debugflag:
        self._verbosenote = self._repo.ui.note
    else:
        self._verbosenote = lambda s: None

    # Maps CL revs to per-revlog revisions. Cleared in close() at
    # the end of each group.
    self._clrevtolocalrev = {}
    self._nextclrevtolocalrev = {}

    # Maps changelog nodes to changelog revs. Filled in once
    # during changelog stage and then left unmodified.
    self._clnodetorev = {}

603

634

604

def _close(self):
    """Finish the current group and return its closing chunk.

    Empties the clrev -> local rev map; if a "next" map has been staged
    it becomes the active map and the staging slot is reset to None.
    The return value is whatever ``closechunk()`` produces.
    """
    # Ellipses serving mode.
    self._clrevtolocalrev.clear()
    if self._nextclrevtolocalrev is not None:
        self._clrevtolocalrev = self._nextclrevtolocalrev
        self._nextclrevtolocalrev = None

    return closechunk()

612

643

613

def group(self, revs, store, ischangelog, lookup, units=None):
    """Calculate a delta group, yielding a sequence of changegroup chunks
    (strings).

    Given a list of revision numbers in ``store`` (already in emission
    order), return a set of deltas and metadata corresponding to them.
    The first delta is first parent(revs[0]) -> revs[0], the receiver is
    guaranteed to have this parent as it has all history before
    these changesets. In the case firstparent is nullrev the
    changegroup starts with a full revision.

    ``lookup`` maps a node of ``store`` to its link node.

    If units is not None, progress detail will be generated, units specifies
    the type of revlog that is touched (changelog, manifest, etc.).

    Note that ``revs`` is modified in place: the first parent of its
    first entry is inserted at index 0.
    """
    # if we don't have any revisions touched by these changesets, bail
    if len(revs) == 0:
        yield self._close()
        return

    # add the parent of the first rev
    p = store.parentrevs(revs[0])[0]
    revs.insert(0, p)

    # build deltas
    progress = None
    if units is not None:
        progress = self._repo.ui.makeprogress(_('bundling'), unit=units,
                                              total=(len(revs) - 1))
    for r in pycompat.xrange(len(revs) - 1):
        if progress:
            progress.update(r + 1)
        # Each revision is emitted as a delta against its predecessor in
        # the (parent-prefixed) list.
        prev, curr = revs[r], revs[r + 1]
        linknode = lookup(store.node(curr))
        for c in self._revchunk(store, ischangelog, curr, prev, linknode):
            yield c

    if progress:
        progress.complete()
    yield self._close()

685

683

686

# filter any nodes that claim to be part of the known set
def _prune(self, store, missing, commonrevs):
    """Return the nodes of ``missing`` whose linkrev is not in ``commonrevs``.

    For manifest revlogs, an empty list is returned outright when the
    file matcher says the store's directory need not be visited.
    """
    # TODO this violates storage abstraction for manifests.
    if isinstance(store, manifest.manifestrevlog):
        # store._dir carries a trailing '/', the root directory is ''.
        if not self._filematcher.visitdir(store._dir[:-1] or '.'):
            return []

    rr, rl = store.rev, store.linkrev
    return [n for n in missing if rl(rr(n)) not in commonrevs]

695

693

696

def _packmanifests(self, dir, dirlog, revs, lookuplinknode):
    """Pack manifests into a changegroup stream.

    Encodes the directory name in the output so multiple manifests
    can be sent. Multiple manifests is not supported by cg1 and cg2.

    ``dirlog`` is the manifest store for ``dir`` and ``revs`` the
    revision numbers in it to emit, already in emission order.
    ``lookuplinknode`` maps a manifest node to its link node.
    """
    if dir:
        # A non-root directory needs a header naming it, which only
        # version 03 can carry.
        assert self.version == b'03'
        yield _fileheader(dir)

    for chunk in self.group(revs, dirlog, False, lookuplinknode,
                            units=_('manifests')):
        yield chunk

712

707

713

def generate(self, commonrevs, clnodes, fastpathlinkrev, source):
    """Yield a sequence of changegroup byte chunks.

    Emits the changelog group, then manifests, then files, followed by
    a final closing chunk. Fires the ``outgoing`` hook once everything
    has been yielded, provided ``clnodes`` is non-empty.
    """

    repo = self._repo
    cl = repo.changelog

    self._verbosenote(_('uncompressed size of bundle content:\n'))
    size = 0

    # clstate is only fully populated once ``chunks`` has been consumed.
    clstate, chunks = self._generatechangelog(cl, clnodes)
    for chunk in chunks:
        size += len(chunk)
        yield chunk

    self._verbosenote(_('%8.i (changelog)\n') % size)

    clrevorder = clstate['clrevorder']
    mfs = clstate['mfs']
    changedfiles = clstate['changedfiles']

    # We need to make sure that the linkrev in the changegroup refers to
    # the first changeset that introduced the manifest or file revision.
    # The fastpath is usually safer than the slowpath, because the filelogs
    # are walked in revlog order.
    #
    # When taking the slowpath with reorder=None and the manifest revlog
    # uses generaldelta, the manifest may be walked in the "wrong" order.
    # Without 'clrevorder', we would get an incorrect linkrev (see fix in
    # cc0ff93d0c0c).
    #
    # When taking the fastpath, we are only vulnerable to reordering
    # of the changelog itself. The changelog never uses generaldelta, so
    # it is only reordered when reorder=True. To handle this case, we
    # simply take the slowpath, which already has the 'clrevorder' logic.
    # This was also fixed in cc0ff93d0c0c.
    fastpathlinkrev = fastpathlinkrev and not self._reorder
    # Treemanifests don't work correctly with fastpathlinkrev
    # either, because we don't discover which directory nodes to
    # send along with files. This could probably be fixed.
    fastpathlinkrev = fastpathlinkrev and (
            'treemanifest' not in repo.requirements)

    fnodes = {} # needed file nodes

    for chunk in self.generatemanifests(commonrevs, clrevorder,
            fastpathlinkrev, mfs, fnodes, source):
        yield chunk

    if self._ellipses:
        mfdicts = None
        if self._isshallow:
            # Must be captured before mfs is cleared just below.
            mfdicts = [(self._repo.manifestlog[n].read(), lr)
                       for (n, lr) in mfs.iteritems()]

    mfs.clear()
    clrevs = set(cl.rev(x) for x in clnodes)

    if not fastpathlinkrev:
        def linknodes(unused, fname):
            return fnodes.get(fname, {})
    else:
        cln = cl.node
        def linknodes(filerevlog, fname):
            llr = filerevlog.linkrev
            fln = filerevlog.node
            revs = ((r, llr(r)) for r in filerevlog)
            return dict((fln(r), cln(lr)) for r, lr in revs if lr in clrevs)

    if self._ellipses:
        # We need to pass the mfdicts variable down into
        # generatefiles(), but more than one command might have
        # wrapped generatefiles so we can't modify the function
        # signature. Instead, we pass the data to ourselves using an
        # instance attribute. I'm sorry.
        self._mfdicts = mfdicts

    for chunk in self.generatefiles(changedfiles, linknodes, commonrevs,
                                    source):
        yield chunk

    yield self._close()

    if clnodes:
        repo.hook('outgoing', node=hex(clnodes[0]), source=source)

797

792

798

def _generatechangelog(self, cl, nodes):
    """Generate data for changelog chunks.

    Returns a 2-tuple of a dict containing state and an iterable of
    byte chunks. The state will not be fully populated until the
    chunk stream has been fully consumed.

    The state dict has the keys ``clrevorder`` (changelog node -> index
    in emission order), ``mfs`` (manifest node -> first changelog node
    seen using it) and ``changedfiles`` (set of file names).
    """
    clrevorder = {}
    mfs = {} # needed manifests
    mfl = self._repo.manifestlog
    # TODO violates storage abstraction.
    mfrevlog = mfl._revlog
    changedfiles = set()

    # Callback for the changelog, used to collect changed files and
    # manifest nodes.
    # Returns the linkrev node (identity in the changelog case).
    def lookupcl(x):
        c = cl.read(x)
        clrevorder[x] = len(clrevorder)

        if self._ellipses:
            # Only update mfs if x is going to be sent. Otherwise we
            # end up with bogus linkrevs specified for manifests and
            # we skip some manifest nodes that we should otherwise
            # have sent.
            if (x in self._fullnodes
                or cl.rev(x) in self._precomputedellipsis):
                n = c[0]
                # Record the first changeset introducing this manifest
                # version.
                mfs.setdefault(n, x)
                # Set this narrow-specific dict so we have the lowest
                # manifest revnum to look up for this cl revnum. (Part of
                # mapping changelog ellipsis parents to manifest ellipsis
                # parents)
                self._nextclrevtolocalrev.setdefault(cl.rev(x),
                                                     mfrevlog.rev(n))
            # We can't trust the changed files list in the changeset if the
            # client requested a shallow clone.
            if self._isshallow:
                changedfiles.update(mfl[c[0]].read().keys())
            else:
                changedfiles.update(c[3])
        else:

            n = c[0]
            # record the first changeset introducing this manifest version
            mfs.setdefault(n, x)
            # Record a complete list of potentially-changed files in
            # this manifest.
            changedfiles.update(c[3])

        return x

    # Changelog doesn't benefit from reordering revisions. So send out
    # revisions in store order.
    revs = sorted(cl.rev(n) for n in nodes)

    state = {
        'clrevorder': clrevorder,
        'mfs': mfs,
        'changedfiles': changedfiles,
    }

    gen = self.group(revs, cl, True, lookupcl, units=_('changesets'))

    return state, gen

862

861

863

def generatemanifests(self, commonrevs, clrevorder, fastpathlinkrev, mfs,
                      fnodes, source):
    """Returns an iterator of changegroup chunks containing manifests.

    `source` is unused here, but is used by extensions like remotefilelog to
    change what is sent based in pulls vs pushes, etc.

    ``mfs`` maps root manifest nodes to changelog nodes. ``fnodes`` is
    filled in as a side effect (file name -> {file node: changelog node})
    when the fast path is not in use.
    """
    repo = self._repo
    mfl = repo.manifestlog
    dirlog = mfl._revlog.dirlog
    # Work list of directory -> {manifest node: changelog node}; the
    # lookup callback below adds subdirectories as it discovers them.
    tmfnodes = {'': mfs}

    # Callback for the manifest, used to collect linkrevs for filelog
    # revisions.
    # Returns the linkrev node (collected in lookupcl).
    def makelookupmflinknode(dir, nodes):
        if fastpathlinkrev:
            assert not dir
            return mfs.__getitem__

        def lookupmflinknode(x):
            """Callback for looking up the linknode for manifests.

            Returns the linkrev node for the specified manifest.

            SIDE EFFECT:

            1) fclnodes gets populated with the list of relevant
               file nodes if we're not using fastpathlinkrev
            2) When treemanifests are in use, collects treemanifest nodes
               to send

            Note that this means manifests must be completely sent to
            the client before you can trust the list of files and
            treemanifests to send.
            """
            clnode = nodes[x]
            mdata = mfl.get(dir, x).readfast(shallow=True)
            for p, n, fl in mdata.iterentries():
                if fl == 't': # subdirectory manifest
                    subdir = dir + p + '/'
                    tmfclnodes = tmfnodes.setdefault(subdir, {})
                    tmfclnode = tmfclnodes.setdefault(n, clnode)
                    # Keep the changeset that comes first in emission order.
                    if clrevorder[clnode] < clrevorder[tmfclnode]:
                        tmfclnodes[n] = clnode
                else:
                    f = dir + p
                    fclnodes = fnodes.setdefault(f, {})
                    fclnode = fclnodes.setdefault(n, clnode)
                    if clrevorder[clnode] < clrevorder[fclnode]:
                        fclnodes[n] = clnode
            return clnode
        return lookupmflinknode

    size = 0
    while tmfnodes:
        dir, nodes = tmfnodes.popitem()
        store = dirlog(dir)
        prunednodes = self._prune(store, nodes, commonrevs)
        # The root manifest group is always emitted, even when empty.
        if not dir or prunednodes:
            lookupfn = makelookupmflinknode(dir, nodes)

            if self._ellipses:
                revs = _sortnodesellipsis(store, prunednodes,
                                          self._clnodetorev, lookupfn)
            else:
                revs = _sortnodesnormal(store, prunednodes,
                                        self._reorder)

            for x in self._packmanifests(dir, store, revs, lookupfn):
                size += len(x)
                yield x
    self._verbosenote(_('%8.i (manifests)\n') % size)
    yield self._manifestsend

928

936

929

# The 'source' parameter is useful for extensions

937

# The 'source' parameter is useful for extensions

930

def generatefiles(self, changedfiles, linknodes, commonrevs, source):

938

def generatefiles(self, changedfiles, linknodes, commonrevs, source):

931

changedfiles = list(filter(self._filematcher, changedfiles))

939

changedfiles = list(filter(self._filematcher, changedfiles))

932

940

933

if self._isshallow:

941

if self._isshallow:

934

# See comment in generate() for why this sadness is a thing.

942

# See comment in generate() for why this sadness is a thing.

935

mfdicts = self._mfdicts

943

mfdicts = self._mfdicts

936

del self._mfdicts

944

del self._mfdicts

937

# In a shallow clone, the linknodes callback needs to also include

945

# In a shallow clone, the linknodes callback needs to also include

938

# those file nodes that are in the manifests we sent but weren't

946

# those file nodes that are in the manifests we sent but weren't

939

# introduced by those manifests.

947

# introduced by those manifests.

940

commonctxs = [self._repo[c] for c in commonrevs]

948

commonctxs = [self._repo[c] for c in commonrevs]

941

oldlinknodes = linknodes

949

oldlinknodes = linknodes

942

clrev = self._repo.changelog.rev

950

clrev = self._repo.changelog.rev

943

951

944

# Defining this function has a side-effect of overriding the

952

# Defining this function has a side-effect of overriding the

945

# function of the same name that was passed in as an argument.

953

# function of the same name that was passed in as an argument.

946

# TODO have caller pass in appropriate function.

954

# TODO have caller pass in appropriate function.

947

def linknodes(flog, fname):

955

def linknodes(flog, fname):

948

for c in commonctxs:

956

for c in commonctxs:

949

try:

957

try:

950

fnode = c.filenode(fname)

958

fnode = c.filenode(fname)

951

self._clrevtolocalrev[c.rev()] = flog.rev(fnode)

959

self._clrevtolocalrev[c.rev()] = flog.rev(fnode)

952

except error.ManifestLookupError:

960

except error.ManifestLookupError:

953

pass

961

pass

954

links = oldlinknodes(flog, fname)

962

links = oldlinknodes(flog, fname)

955

if len(links) != len(mfdicts):

963

if len(links) != len(mfdicts):

956

for mf, lr in mfdicts:

964

for mf, lr in mfdicts:

957

fnode = mf.get(fname, None)

965

fnode = mf.get(fname, None)

958

if fnode in links:

966

if fnode in links:

959

links[fnode] = min(links[fnode], lr, key=clrev)

967

links[fnode] = min(links[fnode], lr, key=clrev)

960

elif fnode:

968

elif fnode:

961

links[fnode] = lr

969

links[fnode] = lr

962

return links

970

return links

963

971

964

return self._generatefiles(changedfiles, linknodes, commonrevs, source)

972

return self._generatefiles(changedfiles, linknodes, commonrevs, source)

965

973

966

def _generatefiles(self, changedfiles, linknodes, commonrevs, source):

974

def _generatefiles(self, changedfiles, linknodes, commonrevs, source):

967

repo = self._repo

975

repo = self._repo

968

progress = repo.ui.makeprogress(_('bundling'), unit=_('files'),

976

progress = repo.ui.makeprogress(_('bundling'), unit=_('files'),

969

total=len(changedfiles))

977

total=len(changedfiles))

970

for i, fname in enumerate(sorted(changedfiles)):

978

for i, fname in enumerate(sorted(changedfiles)):

971

filerevlog = repo.file(fname)

979

filerevlog = repo.file(fname)

972

if not filerevlog:

980

if not filerevlog:

973

raise error.Abort(_("empty or missing file data for %s") %

981

raise error.Abort(_("empty or missing file data for %s") %

974

fname)

982

fname)

975

983

976

linkrevnodes = linknodes(filerevlog, fname)

984

linkrevnodes = linknodes(filerevlog, fname)

977

# Lookup for filenodes, we collected the linkrev nodes above in the

985

# Lookup for filenodes, we collected the linkrev nodes above in the

978

# fastpath case and with lookupmf in the slowpath case.

986

# fastpath case and with lookupmf in the slowpath case.

979

def lookupfilelog(x):

987

def lookupfilelog(x):

980

return linkrevnodes[x]

988

return linkrevnodes[x]

981

989

982

filenodes = self._prune(filerevlog, linkrevnodes, commonrevs)

990

filenodes = self._prune(filerevlog, linkrevnodes, commonrevs)

983

if filenodes:

991

if filenodes:

992

if self._ellipses:

993

revs = _sortnodesellipsis(filerevlog, filenodes,

994

self._clnodetorev, lookupfilelog)

995

else:

996

revs = _sortnodesnormal(filerevlog, filenodes,

997

self._reorder)

998

984

progress.update(i + 1, item=fname)

999

progress.update(i + 1, item=fname)

985

h = _fileheader(fname)

1000

h = _fileheader(fname)

986

size = len(h)

1001

size = len(h)

987

yield h

1002

yield h

988

for chunk in self.group(~~filenode~~s, filerevlog, False,

1003

for chunk in self.group(revs, filerevlog, False, lookupfilelog):

989

lookupfilelog):

990

size += len(chunk)

1004

size += len(chunk)

991

yield chunk

1005

yield chunk

992

self._verbosenote(_('%8.i %s\n') % (size, fname))

1006

self._verbosenote(_('%8.i %s\n') % (size, fname))

993

progress.complete()

1007

progress.complete()

994

1008

995

def _revchunk(self, store, ischangelog, rev, prev, linknode):

1009

def _revchunk(self, store, ischangelog, rev, prev, linknode):

996

if self._ellipses:

1010

if self._ellipses:

997

fn = self._revisiondeltanarrow

1011

fn = self._revisiondeltanarrow

998

else:

1012

else:

999

fn = self._revisiondeltanormal

1013

fn = self._revisiondeltanormal

1000

1014

1001

delta = fn(store, ischangelog, rev, prev, linknode)

1015

delta = fn(store, ischangelog, rev, prev, linknode)

1002

if not delta:

1016

if not delta:

1003

return

1017

return

1004

1018

1005

meta = self._builddeltaheader(delta)

1019

meta = self._builddeltaheader(delta)

1006

l = len(meta) + sum(len(x) for x in delta.deltachunks)

1020

l = len(meta) + sum(len(x) for x in delta.deltachunks)

1007

1021

1008

yield chunkheader(l)

1022

yield chunkheader(l)

1009

yield meta

1023

yield meta

1010

for x in delta.deltachunks:

1024

for x in delta.deltachunks:

1011

yield x

1025

yield x

1012

1026

1013

def _revisiondeltanormal(self, store, ischangelog, rev, prev, linknode):

1027

def _revisiondeltanormal(self, store, ischangelog, rev, prev, linknode):

1014

node = store.node(rev)

1028

node = store.node(rev)

1015

p1, p2 = store.parentrevs(rev)

1029

p1, p2 = store.parentrevs(rev)

1016

base = self._deltaparentfn(store, rev, p1, p2, prev)

1030

base = self._deltaparentfn(store, rev, p1, p2, prev)

1017

1031

1018

prefix = ''

1032

prefix = ''

1019

if store.iscensored(base) or store.iscensored(rev):

1033

if store.iscensored(base) or store.iscensored(rev):

1020

try:

1034

try:

1021

delta = store.revision(node, raw=True)

1035

delta = store.revision(node, raw=True)

1022

except error.CensoredNodeError as e:

1036

except error.CensoredNodeError as e:

1023

delta = e.tombstone

1037

delta = e.tombstone

1024

if base == nullrev:

1038

if base == nullrev:

1025

prefix = mdiff.trivialdiffheader(len(delta))

1039

prefix = mdiff.trivialdiffheader(len(delta))

1026

else:

1040

else:

1027

baselen = store.rawsize(base)

1041

baselen = store.rawsize(base)

1028

prefix = mdiff.replacediffheader(baselen, len(delta))

1042

prefix = mdiff.replacediffheader(baselen, len(delta))

1029

elif base == nullrev:

1043

elif base == nullrev:

1030

delta = store.revision(node, raw=True)

1044

delta = store.revision(node, raw=True)

1031

prefix = mdiff.trivialdiffheader(len(delta))

1045

prefix = mdiff.trivialdiffheader(len(delta))

1032

else:

1046

else:

1033

delta = store.revdiff(base, rev)

1047

delta = store.revdiff(base, rev)

1034

p1n, p2n = store.parents(node)

1048

p1n, p2n = store.parents(node)

1035

1049

1036

return revisiondelta(

1050

return revisiondelta(

1037

node=node,

1051

node=node,

1038

p1node=p1n,

1052

p1node=p1n,

1039

p2node=p2n,

1053

p2node=p2n,

1040

basenode=store.node(base),

1054

basenode=store.node(base),

1041

linknode=linknode,

1055

linknode=linknode,

1042

flags=store.flags(rev),

1056

flags=store.flags(rev),

1043

deltachunks=(prefix, delta),

1057

deltachunks=(prefix, delta),

1044

)

1058

)

1045

1059

1046

def _revisiondeltanarrow(self, store, ischangelog, rev, prev, linknode):

1060

def _revisiondeltanarrow(self, store, ischangelog, rev, prev, linknode):

1047

# build up some mapping information that's useful later. See

1061

# build up some mapping information that's useful later. See

1048

# the local() nested function below.

1062

# the local() nested function below.

1049

if ischangelog:

1063

if ischangelog:

1050

self._clnodetorev[linknode] = rev

1064

self._clnodetorev[linknode] = rev

1051

linkrev = rev

1065

linkrev = rev

1052

self._clrevtolocalrev[linkrev] = rev

1066

self._clrevtolocalrev[linkrev] = rev

1053

else:

1067

else:

1054

linkrev = self._clnodetorev[linknode]

1068

linkrev = self._clnodetorev[linknode]

1055

self._clrevtolocalrev[linkrev] = rev

1069

self._clrevtolocalrev[linkrev] = rev

1056

1070

1057

# This is a node to send in full, because the changeset it

1071

# This is a node to send in full, because the changeset it

1058

# corresponds to was a full changeset.

1072

# corresponds to was a full changeset.

1059

if linknode in self._fullnodes:

1073

if linknode in self._fullnodes:

1060

return self._revisiondeltanormal(store, ischangelog, rev, prev,

1074

return self._revisiondeltanormal(store, ischangelog, rev, prev,

1061

linknode)

1075

linknode)

1062

1076

1063

# At this point, a node can either be one we should skip or an

1077

# At this point, a node can either be one we should skip or an

1064

# ellipsis. If it's not an ellipsis, bail immediately.

1078

# ellipsis. If it's not an ellipsis, bail immediately.

1065

if linkrev not in self._precomputedellipsis:

1079

if linkrev not in self._precomputedellipsis:

1066

return

1080

return

1067

1081

1068

linkparents = self._precomputedellipsis[linkrev]

1082

linkparents = self._precomputedellipsis[linkrev]

1069

def local(clrev):

1083

def local(clrev):

1070

"""Turn a changelog revnum into a local revnum.

1084

"""Turn a changelog revnum into a local revnum.

1071

1085

1072

The ellipsis dag is stored as revnums on the changelog,

1086

The ellipsis dag is stored as revnums on the changelog,

1073

but when we're producing ellipsis entries for

1087

but when we're producing ellipsis entries for

1074

non-changelog revlogs, we need to turn those numbers into

1088

non-changelog revlogs, we need to turn those numbers into

1075

something local. This does that for us, and during the

1089

something local. This does that for us, and during the

1076

changelog sending phase will also expand the stored

1090

changelog sending phase will also expand the stored

1077

mappings as needed.

1091

mappings as needed.

1078

"""

1092

"""

1079

if clrev == nullrev:

1093

if clrev == nullrev:

1080

return nullrev

1094

return nullrev

1081

1095

1082

if ischangelog:

1096

if ischangelog:

1083

# If we're doing the changelog, it's possible that we

1097

# If we're doing the changelog, it's possible that we

1084

# have a parent that is already on the client, and we

1098

# have a parent that is already on the client, and we

1085

# need to store some extra mapping information so that

1099

# need to store some extra mapping information so that

1086

# our contained ellipsis nodes will be able to resolve

1100

# our contained ellipsis nodes will be able to resolve

1087

# their parents.

1101

# their parents.

1088

if clrev not in self._clrevtolocalrev:

1102

if clrev not in self._clrevtolocalrev:

1089

clnode = store.node(clrev)

1103

clnode = store.node(clrev)

1090

self._clnodetorev[clnode] = clrev

1104

self._clnodetorev[clnode] = clrev

1091

return clrev

1105

return clrev

1092

1106

1093

# Walk the ellipsis-ized changelog breadth-first looking for a

1107

# Walk the ellipsis-ized changelog breadth-first looking for a

1094

# change that has been linked from the current revlog.

1108

# change that has been linked from the current revlog.

1095

#

1109

#

1096

# For a flat manifest revlog only a single step should be necessary

1110

# For a flat manifest revlog only a single step should be necessary

1097

# as all relevant changelog entries are relevant to the flat

1111

# as all relevant changelog entries are relevant to the flat

1098

# manifest.

1112

# manifest.

1099

#

1113

#

1100

# For a filelog or tree manifest dirlog however not every changelog

1114

# For a filelog or tree manifest dirlog however not every changelog

1101

# entry will have been relevant, so we need to skip some changelog

1115

# entry will have been relevant, so we need to skip some changelog

1102

# nodes even after ellipsis-izing.

1116

# nodes even after ellipsis-izing.

1103

walk = [clrev]

1117

walk = [clrev]

1104

while walk:

1118

while walk:

1105

p = walk[0]

1119

p = walk[0]

1106

walk = walk[1:]

1120

walk = walk[1:]

1107

if p in self._clrevtolocalrev:

1121

if p in self._clrevtolocalrev:

1108

return self._clrevtolocalrev[p]

1122

return self._clrevtolocalrev[p]

1109

elif p in self._fullnodes:

1123

elif p in self._fullnodes:

1110

walk.extend([pp for pp in self._repo.changelog.parentrevs(p)

1124

walk.extend([pp for pp in self._repo.changelog.parentrevs(p)

1111

if pp != nullrev])

1125

if pp != nullrev])

1112

elif p in self._precomputedellipsis:

1126

elif p in self._precomputedellipsis:

1113

walk.extend([pp for pp in self._precomputedellipsis[p]

1127

walk.extend([pp for pp in self._precomputedellipsis[p]

1114

if pp != nullrev])

1128

if pp != nullrev])

1115

else:

1129

else:

1116

# In this case, we've got an ellipsis with parents

1130

# In this case, we've got an ellipsis with parents

1117

# outside the current bundle (likely an

1131

# outside the current bundle (likely an

1118

# incremental pull). We "know" that we can use the

1132

# incremental pull). We "know" that we can use the

1119

# value of this same revlog at whatever revision

1133

# value of this same revlog at whatever revision

1120

# is pointed to by linknode. "Know" is in scare

1134

# is pointed to by linknode. "Know" is in scare

1121

# quotes because I haven't done enough examination

1135

# quotes because I haven't done enough examination

1122

# of edge cases to convince myself this is really

1136

# of edge cases to convince myself this is really

1123

# a fact - it works for all the (admittedly

1137

# a fact - it works for all the (admittedly

1124

# thorough) cases in our testsuite, but I would be

1138

# thorough) cases in our testsuite, but I would be

1125

# somewhat unsurprised to find a case in the wild

1139

# somewhat unsurprised to find a case in the wild

1126

# where this breaks down a bit. That said, I don't

1140

# where this breaks down a bit. That said, I don't

1127

# know if it would hurt anything.

1141

# know if it would hurt anything.

1128

for i in pycompat.xrange(rev, 0, -1):

1142

for i in pycompat.xrange(rev, 0, -1):

1129

if store.linkrev(i) == clrev:

1143

if store.linkrev(i) == clrev:

1130

return i

1144

return i

1131

# We failed to resolve a parent for this node, so

1145

# We failed to resolve a parent for this node, so

1132

# we crash the changegroup construction.

1146

# we crash the changegroup construction.

1133

raise error.Abort(

1147

raise error.Abort(

1134

'unable to resolve parent while packing %r %r'

1148

'unable to resolve parent while packing %r %r'

1135

' for changeset %r' % (store.indexfile, rev, clrev))

1149

' for changeset %r' % (store.indexfile, rev, clrev))

1136

1150

1137

return nullrev

1151

return nullrev

1138

1152

1139

if not linkparents or (

1153

if not linkparents or (

1140

store.parentrevs(rev) == (nullrev, nullrev)):

1154

store.parentrevs(rev) == (nullrev, nullrev)):

1141

p1, p2 = nullrev, nullrev

1155

p1, p2 = nullrev, nullrev

1142

elif len(linkparents) == 1:

1156

elif len(linkparents) == 1:

1143

p1, = sorted(local(p) for p in linkparents)

1157

p1, = sorted(local(p) for p in linkparents)

1144

p2 = nullrev

1158

p2 = nullrev

1145

else:

1159

else:

1146

p1, p2 = sorted(local(p) for p in linkparents)

1160

p1, p2 = sorted(local(p) for p in linkparents)

1147

1161

1148

n = store.node(rev)

1162

n = store.node(rev)

1149

p1n, p2n = store.node(p1), store.node(p2)

1163

p1n, p2n = store.node(p1), store.node(p2)

1150

flags = store.flags(rev)

1164

flags = store.flags(rev)

1151

flags |= revlog.REVIDX_ELLIPSIS

1165

flags |= revlog.REVIDX_ELLIPSIS

1152

1166

1153

# TODO: try and actually send deltas for ellipsis data blocks

1167

# TODO: try and actually send deltas for ellipsis data blocks

1154

data = store.revision(n)

1168

data = store.revision(n)

1155

diffheader = mdiff.trivialdiffheader(len(data))

1169

diffheader = mdiff.trivialdiffheader(len(data))

1156

1170

1157

return revisiondelta(

1171

return revisiondelta(

1158

node=n,

1172

node=n,

1159

p1node=p1n,

1173

p1node=p1n,

1160

p2node=p2n,

1174

p2node=p2n,

1161

basenode=nullid,

1175

basenode=nullid,

1162

linknode=linknode,

1176

linknode=linknode,

1163

flags=flags,

1177

flags=flags,

1164

deltachunks=(diffheader, data),

1178

deltachunks=(diffheader, data),

1165

)

1179

)

1166

1180

1167

def _deltaparentprev(store, rev, p1, p2, prev):

1181

def _deltaparentprev(store, rev, p1, p2, prev):

1168

"""Resolve a delta parent to the previous revision.

1182

"""Resolve a delta parent to the previous revision.

1169

1183

1170

Used for version 1 changegroups, which don't support generaldelta.

1184

Used for version 1 changegroups, which don't support generaldelta.

1171

"""

1185

"""

1172

return prev

1186

return prev

1173

1187

1174

def _deltaparentgeneraldelta(store, rev, p1, p2, prev):

1188

def _deltaparentgeneraldelta(store, rev, p1, p2, prev):

1175

"""Resolve a delta parent when general deltas are supported."""

1189

"""Resolve a delta parent when general deltas are supported."""

1176

dp = store.deltaparent(rev)

1190

dp = store.deltaparent(rev)

1177

if dp == nullrev and store.storedeltachains:

1191

if dp == nullrev and store.storedeltachains:

1178

# Avoid sending full revisions when delta parent is null. Pick prev

1192

# Avoid sending full revisions when delta parent is null. Pick prev

1179

# in that case. It's tempting to pick p1 in this case, as p1 will

1193

# in that case. It's tempting to pick p1 in this case, as p1 will

1180

# be smaller in the common case. However, computing a delta against

1194

# be smaller in the common case. However, computing a delta against

1181

# p1 may require resolving the raw text of p1, which could be

1195

# p1 may require resolving the raw text of p1, which could be

1182

# expensive. The revlog caches should have prev cached, meaning

1196

# expensive. The revlog caches should have prev cached, meaning

1183

# less CPU for changegroup generation. There is likely room to add

1197

# less CPU for changegroup generation. There is likely room to add

1184

# a flag and/or config option to control this behavior.

1198

# a flag and/or config option to control this behavior.

1185

base = prev

1199

base = prev

1186

elif dp == nullrev:

1200

elif dp == nullrev:

1187

# revlog is configured to use full snapshot for a reason,

1201

# revlog is configured to use full snapshot for a reason,

1188

# stick to full snapshot.

1202

# stick to full snapshot.

1189

base = nullrev

1203

base = nullrev

1190

elif dp not in (p1, p2, prev):

1204

elif dp not in (p1, p2, prev):

1191

# Pick prev when we can't be sure remote has the base revision.

1205

# Pick prev when we can't be sure remote has the base revision.

1192

return prev

1206

return prev

1193

else:

1207

else:

1194

base = dp

1208

base = dp

1195

1209

1196

if base != nullrev and not store.candelta(base, rev):

1210

if base != nullrev and not store.candelta(base, rev):

1197

base = nullrev

1211

base = nullrev

1198

1212

1199

return base

1213

return base

1200

1214

1201

def _deltaparentellipses(store, rev, p1, p2, prev):

1215

def _deltaparentellipses(store, rev, p1, p2, prev):

1202

"""Resolve a delta parent when in ellipses mode."""

1216

"""Resolve a delta parent when in ellipses mode."""

1203

# TODO: send better deltas when in narrow mode.

1217

# TODO: send better deltas when in narrow mode.

1204

#

1218

#

1205

# changegroup.group() loops over revisions to send,

1219

# changegroup.group() loops over revisions to send,

1206

# including revisions we'll skip. What this means is that

1220

# including revisions we'll skip. What this means is that

1207

# `prev` will be a potentially useless delta base for all

1221

# `prev` will be a potentially useless delta base for all

1208

# ellipsis nodes, as the client likely won't have it. In

1222

# ellipsis nodes, as the client likely won't have it. In

1209

# the future we should do bookkeeping about which nodes

1223

# the future we should do bookkeeping about which nodes

1210

# have been sent to the client, and try to be

1224

# have been sent to the client, and try to be

1211

# significantly smarter about delta bases. This is

1225

# significantly smarter about delta bases. This is

1212

# slightly tricky because this same code has to work for

1226

# slightly tricky because this same code has to work for

1213

# all revlogs, and we don't have the linkrev/linknode here.

1227

# all revlogs, and we don't have the linkrev/linknode here.

1214

return p1

1228

return p1

1215

1229

1216

def _makecg1packer(repo, filematcher, bundlecaps, ellipses=False,

1230

def _makecg1packer(repo, filematcher, bundlecaps, ellipses=False,

1217

shallow=False, ellipsisroots=None, fullnodes=None):

1231

shallow=False, ellipsisroots=None, fullnodes=None):

1218

builddeltaheader = lambda d: _CHANGEGROUPV1_DELTA_HEADER.pack(

1232

builddeltaheader = lambda d: _CHANGEGROUPV1_DELTA_HEADER.pack(

1219

d.node, d.p1node, d.p2node, d.linknode)

1233

d.node, d.p1node, d.p2node, d.linknode)

1220

1234

1221

return cgpacker(repo, filematcher, b'01',

1235

return cgpacker(repo, filematcher, b'01',

1222

deltaparentfn=_deltaparentprev,

1236

deltaparentfn=_deltaparentprev,

1223

allowreorder=None,

1237

allowreorder=None,

1224

builddeltaheader=builddeltaheader,

1238

builddeltaheader=builddeltaheader,

1225

manifestsend=b'',

1239

manifestsend=b'',

1226

bundlecaps=bundlecaps,

1240

bundlecaps=bundlecaps,

1227

ellipses=ellipses,

1241

ellipses=ellipses,

1228

shallow=shallow,

1242

shallow=shallow,

1229

ellipsisroots=ellipsisroots,

1243

ellipsisroots=ellipsisroots,

1230

fullnodes=fullnodes)

1244

fullnodes=fullnodes)

1231

1245

1232

def _makecg2packer(repo, filematcher, bundlecaps, ellipses=False,

1246

def _makecg2packer(repo, filematcher, bundlecaps, ellipses=False,

1233

shallow=False, ellipsisroots=None, fullnodes=None):

1247

shallow=False, ellipsisroots=None, fullnodes=None):

1234

builddeltaheader = lambda d: _CHANGEGROUPV2_DELTA_HEADER.pack(

1248

builddeltaheader = lambda d: _CHANGEGROUPV2_DELTA_HEADER.pack(

1235

d.node, d.p1node, d.p2node, d.basenode, d.linknode)

1249

d.node, d.p1node, d.p2node, d.basenode, d.linknode)

1236

1250

1237

# Since generaldelta is directly supported by cg2, reordering

1251

# Since generaldelta is directly supported by cg2, reordering

1238

# generally doesn't help, so we disable it by default (treating

1252

# generally doesn't help, so we disable it by default (treating

1239

# bundle.reorder=auto just like bundle.reorder=False).

1253

# bundle.reorder=auto just like bundle.reorder=False).

1240

return cgpacker(repo, filematcher, b'02',

1254

return cgpacker(repo, filematcher, b'02',

1241

deltaparentfn=_deltaparentgeneraldelta,

1255

deltaparentfn=_deltaparentgeneraldelta,

1242

allowreorder=False,

1256

allowreorder=False,

1243

builddeltaheader=builddeltaheader,

1257

builddeltaheader=builddeltaheader,

1244

manifestsend=b'',

1258

manifestsend=b'',

1245

bundlecaps=bundlecaps,

1259

bundlecaps=bundlecaps,

1246

ellipses=ellipses,

1260

ellipses=ellipses,

1247

shallow=shallow,

1261

shallow=shallow,

1248

ellipsisroots=ellipsisroots,

1262

ellipsisroots=ellipsisroots,

1249

fullnodes=fullnodes)

1263

fullnodes=fullnodes)

1250

1264

1251

def _makecg3packer(repo, filematcher, bundlecaps, ellipses=False,

1265

def _makecg3packer(repo, filematcher, bundlecaps, ellipses=False,

1252

shallow=False, ellipsisroots=None, fullnodes=None):

1266

shallow=False, ellipsisroots=None, fullnodes=None):

1253

builddeltaheader = lambda d: _CHANGEGROUPV3_DELTA_HEADER.pack(

1267

builddeltaheader = lambda d: _CHANGEGROUPV3_DELTA_HEADER.pack(

1254

d.node, d.p1node, d.p2node, d.basenode, d.linknode, d.flags)

1268

d.node, d.p1node, d.p2node, d.basenode, d.linknode, d.flags)

1255

1269

1256

deltaparentfn = (_deltaparentellipses if ellipses

1270

deltaparentfn = (_deltaparentellipses if ellipses

1257

else _deltaparentgeneraldelta)

1271

else _deltaparentgeneraldelta)

1258

1272

1259

return cgpacker(repo, filematcher, b'03',

1273

return cgpacker(repo, filematcher, b'03',

1260

deltaparentfn=deltaparentfn,

1274

deltaparentfn=deltaparentfn,

1261

allowreorder=False,

1275

allowreorder=False,

1262

builddeltaheader=builddeltaheader,

1276

builddeltaheader=builddeltaheader,

1263

manifestsend=closechunk(),

1277

manifestsend=closechunk(),

1264

bundlecaps=bundlecaps,

1278

bundlecaps=bundlecaps,

1265

ellipses=ellipses,

1279

ellipses=ellipses,

1266

shallow=shallow,

1280

shallow=shallow,

1267

ellipsisroots=ellipsisroots,

1281

ellipsisroots=ellipsisroots,

1268

fullnodes=fullnodes)

1282

fullnodes=fullnodes)

1269

1283

1270

_packermap = {'01': (_makecg1packer, cg1unpacker),

1284

_packermap = {'01': (_makecg1packer, cg1unpacker),

1271

# cg2 adds support for exchanging generaldelta

1285

# cg2 adds support for exchanging generaldelta

1272

'02': (_makecg2packer, cg2unpacker),

1286

'02': (_makecg2packer, cg2unpacker),

1273

# cg3 adds support for exchanging revlog flags and treemanifests

1287

# cg3 adds support for exchanging revlog flags and treemanifests

1274

'03': (_makecg3packer, cg3unpacker),

1288

'03': (_makecg3packer, cg3unpacker),

1275

}

1289

}

1276

1290

1277

def allsupportedversions(repo):

1291

def allsupportedversions(repo):

1278

versions = set(_packermap.keys())

1292

versions = set(_packermap.keys())

1279

if not (repo.ui.configbool('experimental', 'changegroup3') or

1293

if not (repo.ui.configbool('experimental', 'changegroup3') or

1280

repo.ui.configbool('experimental', 'treemanifest') or

1294

repo.ui.configbool('experimental', 'treemanifest') or

1281

'treemanifest' in repo.requirements):

1295

'treemanifest' in repo.requirements):

1282

versions.discard('03')

1296

versions.discard('03')

1283

return versions

1297

return versions

1284

1298

1285

# Changegroup versions that can be applied to the repo

1299

# Changegroup versions that can be applied to the repo

1286

def supportedincomingversions(repo):

1300

def supportedincomingversions(repo):

1287

return allsupportedversions(repo)

1301

return allsupportedversions(repo)

1288

1302

1289

# Changegroup versions that can be created from the repo

1303

# Changegroup versions that can be created from the repo

1290

def supportedoutgoingversions(repo):

1304

def supportedoutgoingversions(repo):

1291

versions = allsupportedversions(repo)

1305

versions = allsupportedversions(repo)

1292

if 'treemanifest' in repo.requirements:

1306

if 'treemanifest' in repo.requirements:

1293

# Versions 01 and 02 support only flat manifests and it's just too

1307

# Versions 01 and 02 support only flat manifests and it's just too

1294

# expensive to convert between the flat manifest and tree manifest on

1308

# expensive to convert between the flat manifest and tree manifest on

1295

# the fly. Since tree manifests are hashed differently, all of history

1309

# the fly. Since tree manifests are hashed differently, all of history

1296

# would have to be converted. Instead, we simply don't even pretend to

1310

# would have to be converted. Instead, we simply don't even pretend to

1297

# support versions 01 and 02.

1311

# support versions 01 and 02.

1298

versions.discard('01')

1312

versions.discard('01')

1299

versions.discard('02')

1313

versions.discard('02')

1300

if repository.NARROW_REQUIREMENT in repo.requirements:

1314

if repository.NARROW_REQUIREMENT in repo.requirements:

1301

# Versions 01 and 02 don't support revlog flags, and we need to

1315

# Versions 01 and 02 don't support revlog flags, and we need to

1302

# support that for stripping and unbundling to work.

1316

# support that for stripping and unbundling to work.

1303

versions.discard('01')

1317

versions.discard('01')

1304

versions.discard('02')

1318

versions.discard('02')

1305

if LFS_REQUIREMENT in repo.requirements:

1319

if LFS_REQUIREMENT in repo.requirements:

1306

# Versions 01 and 02 don't support revlog flags, and we need to

1320

# Versions 01 and 02 don't support revlog flags, and we need to

1307

# mark LFS entries with REVIDX_EXTSTORED.

1321

# mark LFS entries with REVIDX_EXTSTORED.

1308

versions.discard('01')

1322

versions.discard('01')

1309

versions.discard('02')

1323

versions.discard('02')

1310

1324

1311

return versions

1325

return versions

1312

1326

1313

def localversion(repo):

1327

def localversion(repo):

1314

# Finds the best version to use for bundles that are meant to be used

1328

# Finds the best version to use for bundles that are meant to be used

1315

# locally, such as those from strip and shelve, and temporary bundles.

1329

# locally, such as those from strip and shelve, and temporary bundles.

1316

return max(supportedoutgoingversions(repo))

1330

return max(supportedoutgoingversions(repo))

1317

1331

1318

def safeversion(repo):

1332

def safeversion(repo):

1319

# Finds the smallest version that it's safe to assume clients of the repo

1333

# Finds the smallest version that it's safe to assume clients of the repo

1320

# will support. For example, all hg versions that support generaldelta also

1334

# will support. For example, all hg versions that support generaldelta also

1321

# support changegroup 02.

1335

# support changegroup 02.

1322

versions = supportedoutgoingversions(repo)

1336

versions = supportedoutgoingversions(repo)

1323

if 'generaldelta' in repo.requirements:

1337

if 'generaldelta' in repo.requirements:

1324

versions.discard('01')

1338

versions.discard('01')

1325

assert versions

1339

assert versions

1326

return min(versions)

1340

return min(versions)

1327

1341

1328

def getbundler(version, repo, bundlecaps=None, filematcher=None,

1342

def getbundler(version, repo, bundlecaps=None, filematcher=None,

1329

ellipses=False, shallow=False, ellipsisroots=None,

1343

ellipses=False, shallow=False, ellipsisroots=None,

1330

fullnodes=None):

1344

fullnodes=None):

1331

assert version in supportedoutgoingversions(repo)

1345

assert version in supportedoutgoingversions(repo)

1332

1346

1333

if filematcher is None:

1347

if filematcher is None:

1334

filematcher = matchmod.alwaysmatcher(repo.root, '')

1348

filematcher = matchmod.alwaysmatcher(repo.root, '')

1335

1349

1336

if version == '01' and not filematcher.always():

1350

if version == '01' and not filematcher.always():

1337

raise error.ProgrammingError('version 01 changegroups do not support '

1351

raise error.ProgrammingError('version 01 changegroups do not support '

1338

'sparse file matchers')

1352

'sparse file matchers')

1339

1353

1340

if ellipses and version in (b'01', b'02'):

1354

if ellipses and version in (b'01', b'02'):

1341

raise error.Abort(

1355

raise error.Abort(

1342

_('ellipsis nodes require at least cg3 on client and server, '

1356

_('ellipsis nodes require at least cg3 on client and server, '

1343

'but negotiated version %s') % version)

1357

'but negotiated version %s') % version)

1344

1358

1345

# Requested files could include files not in the local store. So

1359

# Requested files could include files not in the local store. So

1346

# filter those out.

1360

# filter those out.

1347

filematcher = matchmod.intersectmatchers(repo.narrowmatch(),

1361

filematcher = matchmod.intersectmatchers(repo.narrowmatch(),

1348

filematcher)

1362

filematcher)

1349

1363

1350

fn = _packermap[version][0]

1364

fn = _packermap[version][0]

1351

return fn(repo, filematcher, bundlecaps, ellipses=ellipses,

1365

return fn(repo, filematcher, bundlecaps, ellipses=ellipses,

1352

shallow=shallow, ellipsisroots=ellipsisroots,

1366

shallow=shallow, ellipsisroots=ellipsisroots,

1353

fullnodes=fullnodes)

1367

fullnodes=fullnodes)

1354

1368

1355

def getunbundler(version, fh, alg, extras=None):

1369

def getunbundler(version, fh, alg, extras=None):

1356

return _packermap[version][1](fh, alg, extras=extras)

1370

return _packermap[version][1](fh, alg, extras=extras)

1357

1371

1358

def _changegroupinfo(repo, nodes, source):

1372

def _changegroupinfo(repo, nodes, source):

1359

if repo.ui.verbose or source == 'bundle':

1373

if repo.ui.verbose or source == 'bundle':

1360

repo.ui.status(_("%d changesets found\n") % len(nodes))

1374

repo.ui.status(_("%d changesets found\n") % len(nodes))

1361

if repo.ui.debugflag:

1375

if repo.ui.debugflag:

1362

repo.ui.debug("list of changesets:\n")

1376

repo.ui.debug("list of changesets:\n")

1363

for node in nodes:

1377

for node in nodes:

1364

repo.ui.debug("%s\n" % hex(node))

1378

repo.ui.debug("%s\n" % hex(node))

1365

1379

1366

def makechangegroup(repo, outgoing, version, source, fastpath=False,

1380

def makechangegroup(repo, outgoing, version, source, fastpath=False,

1367

bundlecaps=None):

1381

bundlecaps=None):

1368

cgstream = makestream(repo, outgoing, version, source,

1382

cgstream = makestream(repo, outgoing, version, source,

1369

fastpath=fastpath, bundlecaps=bundlecaps)

1383

fastpath=fastpath, bundlecaps=bundlecaps)

1370

return getunbundler(version, util.chunkbuffer(cgstream), None,

1384

return getunbundler(version, util.chunkbuffer(cgstream), None,

1371

{'clcount': len(outgoing.missing) })

1385

{'clcount': len(outgoing.missing) })

1372

1386

1373

def makestream(repo, outgoing, version, source, fastpath=False,

1387

def makestream(repo, outgoing, version, source, fastpath=False,

1374

bundlecaps=None, filematcher=None):

1388

bundlecaps=None, filematcher=None):

1375

bundler = getbundler(version, repo, bundlecaps=bundlecaps,

1389

bundler = getbundler(version, repo, bundlecaps=bundlecaps,

1376

filematcher=filematcher)

1390

filematcher=filematcher)

1377

1391

1378

repo = repo.unfiltered()

1392

repo = repo.unfiltered()

1379

commonrevs = outgoing.common

1393

commonrevs = outgoing.common

1380

csets = outgoing.missing

1394

csets = outgoing.missing

1381

heads = outgoing.missingheads

1395

heads = outgoing.missingheads

1382

# We go through the fast path if we get told to, or if all (unfiltered

1396

# We go through the fast path if we get told to, or if all (unfiltered

1383

# heads have been requested (since we then know there all linkrevs will

1397

# heads have been requested (since we then know there all linkrevs will

1384

# be pulled by the client).

1398

# be pulled by the client).

1385

heads.sort()

1399

heads.sort()

1386

fastpathlinkrev = fastpath or (

1400

fastpathlinkrev = fastpath or (

1387

repo.filtername is None and heads == sorted(repo.heads()))

1401

repo.filtername is None and heads == sorted(repo.heads()))

1388

1402

1389

repo.hook('preoutgoing', throw=True, source=source)

1403

repo.hook('preoutgoing', throw=True, source=source)

1390

_changegroupinfo(repo, csets, source)

1404

_changegroupinfo(repo, csets, source)

1391

return bundler.generate(commonrevs, csets, fastpathlinkrev, source)

1405

return bundler.generate(commonrevs, csets, fastpathlinkrev, source)

1392

1406

1393

def _addchangegroupfiles(repo, source, revmap, trp, expectedfiles, needfiles):

1407

def _addchangegroupfiles(repo, source, revmap, trp, expectedfiles, needfiles):

1394

revisions = 0

1408

revisions = 0

1395

files = 0

1409

files = 0

1396

progress = repo.ui.makeprogress(_('files'), unit=_('files'),

1410

progress = repo.ui.makeprogress(_('files'), unit=_('files'),

1397

total=expectedfiles)

1411

total=expectedfiles)

1398

for chunkdata in iter(source.filelogheader, {}):

1412

for chunkdata in iter(source.filelogheader, {}):

1399

files += 1

1413

files += 1

1400

f = chunkdata["filename"]

1414

f = chunkdata["filename"]

1401

repo.ui.debug("adding %s revisions\n" % f)

1415

repo.ui.debug("adding %s revisions\n" % f)

1402

progress.increment()

1416

progress.increment()

1403

fl = repo.file(f)

1417

fl = repo.file(f)

1404

o = len(fl)

1418

o = len(fl)

1405

try:

1419

try:

1406

deltas = source.deltaiter()

1420

deltas = source.deltaiter()

1407

if not fl.addgroup(deltas, revmap, trp):

1421

if not fl.addgroup(deltas, revmap, trp):

1408

raise error.Abort(_("received file revlog group is empty"))

1422

raise error.Abort(_("received file revlog group is empty"))

1409

except error.CensoredBaseError as e:

1423

except error.CensoredBaseError as e:

1410

raise error.Abort(_("received delta base is censored: %s") % e)

1424

raise error.Abort(_("received delta base is censored: %s") % e)

1411

revisions += len(fl) - o

1425

revisions += len(fl) - o

1412

if f in needfiles:

1426

if f in needfiles:

1413

needs = needfiles[f]

1427

needs = needfiles[f]

1414

for new in pycompat.xrange(o, len(fl)):

1428

for new in pycompat.xrange(o, len(fl)):

1415

n = fl.node(new)

1429

n = fl.node(new)

1416

if n in needs:

1430

if n in needs:

1417

needs.remove(n)

1431

needs.remove(n)

1418

else:

1432

else:

1419

raise error.Abort(

1433

raise error.Abort(

1420

_("received spurious file revlog entry"))

1434

_("received spurious file revlog entry"))

1421

if not needs:

1435

if not needs:

1422

del needfiles[f]

1436

del needfiles[f]

1423

progress.complete()

1437

progress.complete()

1424

1438

1425

for f, needs in needfiles.iteritems():

1439

for f, needs in needfiles.iteritems():

1426

fl = repo.file(f)

1440

fl = repo.file(f)

1427

for n in needs:

1441

for n in needs:

1428

try:

1442

try:

1429

fl.rev(n)

1443

fl.rev(n)

1430

except error.LookupError:

1444

except error.LookupError:

1431

raise error.Abort(

1445

raise error.Abort(

1432

_('missing file data for %s:%s - run hg verify') %

1446

_('missing file data for %s:%s - run hg verify') %

1433

(f, hex(n)))

1447

(f, hex(n)))

1434

1448

1435

return revisions, files

1449

return revisions, files

	Site-wide shortcuts
/	Use quick search box
g h	Goto home page
g g	Goto my private gists page
g G	Goto my public gists page
g 0-9	Goto bookmarked items from 0-9
n r	New repository page
n g	New gist page

	Repositories
g s	Goto summary page
g c	Goto changelog page
g f	Goto files page
g F	Goto files page with file search activated
g p	Goto pull requests page
g o	Goto repository settings
g O	Goto repository access permissions settings
t s	Toggle sidebar on some pages

             # changegroup.py - Mercurial changegroup manipulation functions
             #
             #  Copyright 2006 Matt Mackall <mpm@selenic.com>
             #
             # This software may be used and distributed according to the terms of the
             # GNU General Public License version 2 or any later version.
             from __future__ import absolute_import
             import os
             import struct
             import weakref
             from .i18n import _
             from .node import (
                 hex,
                 nullid,
                 nullrev,
                 short,
             )
             from .thirdparty import (
                 attr,
             )
             from . import (
                 dagutil,
                 error,
                 manifest,
                 match as matchmod,
                 mdiff,
                 phases,
                 pycompat,
                 repository,
                 revlog,
                 util,
             )
             from .utils import (
                 stringutil,
             )
             _CHANGEGROUPV1_DELTA_HEADER = struct.Struct("20s20s20s20s")
             _CHANGEGROUPV2_DELTA_HEADER = struct.Struct("20s20s20s20s20s")
             _CHANGEGROUPV3_DELTA_HEADER = struct.Struct(">20s20s20s20s20sH")
             LFS_REQUIREMENT = 'lfs'
             readexactly = util.readexactly
             def getchunk(stream):
                 """Read one length-prefixed chunk from ``stream`` and return its payload.

                 The chunk starts with a 4-byte big-endian signed length that counts
                 the length field itself. A length of 0 denotes an empty chunk and
                 yields ``""``; any other length of 4 or less raises ``error.Abort``.
                 """
                 header = readexactly(stream, 4)
                 (length,) = struct.unpack(">l", header)
                 if length > 4:
                     # The stored length includes the four header bytes just consumed.
                     return readexactly(stream, length - 4)
                 if length != 0:
                     raise error.Abort(_("invalid chunk length %d") % length)
                 return ""
             def chunkheader(length):
                 """Build the 4-byte header that precedes a chunk of ``length`` bytes.

                 The encoded value is a big-endian signed 32-bit integer that counts
                 the header's own four bytes in addition to the payload.
                 """
                 framedlength = length + 4
                 return struct.pack(">l", framedlength)
             def closechunk():
                 """Build the chunk header describing a zero-length chunk.

                 The result is the packed big-endian 32-bit length field holding 0.
                 """
                 emptylength = 0
                 return struct.pack(">l", emptylength)
             def _fileheader(path):
                 """Return ``path`` framed as a chunk: its chunk header, then the path."""
                 header = chunkheader(len(path))
                 return header + path
             def writechunks(ui, chunks, filename, vfs=None):
                 """Write every item of ``chunks`` to a file and return the file's name.

                 The stream is assumed to be a bundle file.

                 When ``filename`` is empty a temporary ``hg-bundle-*.hg`` file is
                 created and its name is returned. Otherwise the file is opened for
                 binary writing through ``vfs`` if one is given, or with the builtin
                 ``open`` if not. If writing fails part-way, the partially written
                 file is removed before the exception propagates.
                 """
                 handle = None
                 # Path to delete on failure; only set once the file is actually open.
                 pending = None
                 try:
                     if not filename:
                         fd, filename = pycompat.mkstemp(prefix="hg-bundle-", suffix=".hg")
                         handle = os.fdopen(fd, r"wb")
                     elif vfs:
                         handle = vfs.open(filename, "wb")
                     else:
                         # Increase default buffer size because default is usually
                         # small (4k is common on Linux).
                         handle = open(filename, "wb", 131072)
                     pending = filename
                     for chunk in chunks:
                         handle.write(chunk)
                     # Everything was written: keep the file.
                     pending = None
                     return filename
                 finally:
                     if handle is not None:
                         handle.close()
                     if pending is not None:
                         if filename and vfs:
                             vfs.unlink(pending)
                         else:
                             os.unlink(pending)
             class cg1unpacker(object):
                 """Unpacker for cg1 changegroup streams.

                 A changegroup unpacker handles the framing of the revision data in
                 the wire format. Most consumers will want to use the apply()
                 method to add the changes from the changegroup to a repository.

                 If you're forwarding a changegroup unmodified to another consumer,
                 use getchunks(), which returns an iterator of changegroup
                 chunks. This is mostly useful for cases where you need to know the
                 data stream has ended by observing the end of the changegroup.

                 deltachunk() is useful only if you're applying delta data. Most
                 consumers should prefer apply() instead.

                 A few other public methods exist. Those are used only for
                 bundlerepo and some debug commands - their use is discouraged.
                 """
                 # struct.Struct describing the fixed-size header of each delta chunk.
                 deltaheader = _CHANGEGROUPV1_DELTA_HEADER
                 deltaheadersize = deltaheader.size
                 version = '01'
                 _grouplistcount = 1 # One list of files after the manifests
                 def __init__(self, fh, alg, extras=None):
                     """Wrap ``fh`` in a decompressing reader for bundle type ``alg``.

                     ``alg`` of None is treated as 'UN'. A type that is not listed in
                     util.compengines.supportedbundletypes raises error.Abort.
                     ``extras`` is stored as ``self.extras`` (an empty dict when falsy).
                     """
                     if alg is None:
                         alg = 'UN'
                     if alg not in util.compengines.supportedbundletypes:
                         raise error.Abort(_('unknown stream compression type: %s')
                                          % alg)
                     # 'BZ' is looked up under the '_truncatedBZ' engine name.
                     if alg == 'BZ':
                         alg = '_truncatedBZ'
                     compengine = util.compengines.forbundletype(alg)
                     self._stream = compengine.decompressorreader(fh)
                     self._type = alg
                     self.extras = extras or {}
                     # Optional zero-argument callable invoked by _chunklength() for
                     # every non-empty chunk; apply() uses it to drive progress.
                     self.callback = None
                 # These methods (compressed, read, seek, tell) all appear to only
                 # be used by bundlerepo, but it's a little hard to tell.
                 def compressed(self):
                     """Return True when the stream type is set and is not 'UN'."""
                     return self._type is not None and self._type != 'UN'
                 def read(self, l):
                     """Read ``l`` bytes from the decompressed stream."""
                     return self._stream.read(l)
                 def seek(self, pos):
                     """Delegate to the underlying stream's seek()."""
                     return self._stream.seek(pos)
                 def tell(self):
                     """Delegate to the underlying stream's tell()."""
                     return self._stream.tell()
                 def close(self):
                     """Delegate to the underlying stream's close()."""
                     return self._stream.close()
                 def _chunklength(self):
                     """Read a chunk header and return the payload length that follows.

                     Returns 0 for an empty chunk (stored length 0). Any other stored
                     length of 4 or less raises error.Abort. For a non-empty chunk the
                     progress callback, if set, is invoked before returning.
                     """
                     d = readexactly(self._stream, 4)
                     l = struct.unpack(">l", d)[0]
                     if l <= 4:
                         if l:
                             raise error.Abort(_("invalid chunk length %d") % l)
                         return 0
                     if self.callback:
                         self.callback()
                     # The stored length counts the 4 header bytes themselves.
                     return l - 4
                 def changelogheader(self):
                     """v10 does not have a changelog header chunk"""
                     return {}
                 def manifestheader(self):
                     """v10 does not have a manifest header chunk"""
                     return {}
                 def filelogheader(self):
                     """return the header of the filelogs chunk, v10 only has the filename

                     Returns {} when an empty chunk is read instead of a filename.
                     """
                     l = self._chunklength()
                     if not l:
                         return {}
                     fname = readexactly(self._stream, l)
                     return {'filename': fname}
                 def _deltaheader(self, headertuple, prevnode):
                     """Expand an unpacked cg1 delta header to the common 6-tuple.

                     The cg1 header holds no delta base, so it is derived here: p1 when
                     ``prevnode`` is None, otherwise ``prevnode``. Flags are always 0.
                     """
                     node, p1, p2, cs = headertuple
                     if prevnode is None:
                         deltabase = p1
                     else:
                         deltabase = prevnode
                     flags = 0
                     return node, p1, p2, deltabase, cs, flags
                 def deltachunk(self, prevnode):
                     """Read the next delta chunk.

                     Returns {} when an empty chunk is read, otherwise the tuple
                     (node, p1, p2, cs, deltabase, delta, flags). Note that this order
                     differs from the tuple returned by _deltaheader().
                     """
                     l = self._chunklength()
                     if not l:
                         return {}
                     headerdata = readexactly(self._stream, self.deltaheadersize)
                     header = self.deltaheader.unpack(headerdata)
                     # Whatever follows the fixed-size header is the raw delta.
                     delta = readexactly(self._stream, l - self.deltaheadersize)
                     node, p1, p2, deltabase, cs, flags = self._deltaheader(header, prevnode)
                     return (node, p1, p2, cs, deltabase, delta, flags)
                 def getchunks(self):
                     """returns all the chunks contained in the bundle

                     Used when you need to forward the binary stream to a file or another
                     network API. To do so, it parses the changegroup data, otherwise it
                     will block in case of sshrepo because it doesn't know the end of the
                     stream.
                     """
                     # For changegroup 1 and 2, we expect 3 parts: changelog, manifestlog,
                     # and a list of filelogs. For changegroup 3, we expect 4 parts:
                     # changelog, manifestlog, a list of tree manifestlogs, and a list of
                     # filelogs.
                     #
                     # Changelog and manifestlog parts are terminated with empty chunks. The
                     # tree and file parts are a list of entry sections. Each entry section
                     # is a series of chunks terminating in an empty chunk. The list of these
                     # entry sections is terminated in yet another empty chunk, so we know
                     # we've reached the end of the tree/file list when we reach an empty
                     # chunk that was preceded by no non-empty chunks.
                     parts = 0
                     while parts < 2 + self._grouplistcount:
                         noentries = True
                         while True:
                             # self is passed as the stream, so reads go through read().
                             chunk = getchunk(self)
                             if not chunk:
                                 # The first two empty chunks represent the end of the
                                 # changelog and the manifestlog portions. The remaining
                                 # empty chunks represent either A) the end of individual
                                 # tree or file entries in the file list, or B) the end of
                                 # the entire list. It's the end of the entire list if there
                                 # were no entries (i.e. noentries is True).
                                 if parts < 2:
                                     parts += 1
                                 elif noentries:
                                     parts += 1
                                 break
                             noentries = False
                             yield chunkheader(len(chunk))
                             # Emit the payload in slices of at most 2**20 bytes.
                             pos = 0
                             while pos < len(chunk):
                                 next = pos + 2**20
                                 yield chunk[pos:next]
                                 pos = next
                         yield closechunk()
                 def _unpackmanifests(self, repo, revmap, trp, prog):
                     """Read the manifest group and add it to repo.manifestlog.

                     ``prog`` is a progress object: its increment() is installed as the
                     chunk callback while the group is read, and complete() is called
                     afterwards.
                     """
                     self.callback = prog.increment
                     # no need to check for empty manifest group here:
                     # if the result of the merge of 1 and 2 is the same in 3 and 4,
                     # no new manifest will be created and the manifest group will
                     # be empty during the pull
                     self.manifestheader()
                     deltas = self.deltaiter()
                     repo.manifestlog.addgroup(deltas, revmap, trp)
                     prog.complete()
                     self.callback = None
                 def apply(self, repo, tr, srctype, url, targetphase=phases.draft,
                           expectedtotal=None):
                     """Add the changegroup returned by source.read() to this repo.

                     srctype is a string like 'push', 'pull', or 'unbundle'.  url is
                     the URL of the repo where this changegroup is coming from.

                     Return an integer summarizing the change to this repo:
                     - nothing changed or no source: 0
                     - more heads than before: 1+added heads (2..n)
                     - fewer heads than before: -1-removed heads (-2..-n)
                     - number of heads stays the same: 1
                     """
                     repo = repo.unfiltered()
                     # Link-revision mapper used while adding changesets: returns the
                     # current length of the changelog. ``cl`` is bound further down.
                     def csmap(x):
                         repo.ui.debug("add changeset %s\n" % short(x))
                         return len(cl)
                     # Link-revision mapper for manifests and files: looks the
                     # changeset node up in the changelog.
                     def revmap(x):
                         return cl.rev(x)
                     changesets = files = revisions = 0
                     try:
                         # The transaction may already carry source information. In this
                         # case we use the top level data. We overwrite the argument
                         # because we need to use the top level value (if they exist)
                         # in this function.
                         srctype = tr.hookargs.setdefault('source', srctype)
                         url = tr.hookargs.setdefault('url', url)
                         repo.hook('prechangegroup',
                                   throw=True, **pycompat.strkwargs(tr.hookargs))
                         # write changelog data to temp files so concurrent readers
                         # will not see an inconsistent view
                         cl = repo.changelog
                         cl.delayupdate(tr)
                         oldheads = set(cl.heads())
                         trp = weakref.proxy(tr)
                         # pull off the changeset group
                         repo.ui.status(_("adding changesets\n"))
                         clstart = len(cl)
                         progress = repo.ui.makeprogress(_('changesets'), unit=_('chunks'),
                                                         total=expectedtotal)
                         self.callback = progress.increment
                         # Collects the files named by every incoming changeset.
                         efiles = set()
                         def onchangelog(cl, node):
                             efiles.update(cl.readfiles(node))
                         self.changelogheader()
                         deltas = self.deltaiter()
                         cgnodes = cl.addgroup(deltas, csmap, trp, addrevisioncb=onchangelog)
                         # From here on efiles is a count, used as the expected number
                         # of files for the file progress bar.
                         efiles = len(efiles)
                         if not cgnodes:
                             repo.ui.develwarn('applied empty changegroup',
                                               config='warn-empty-changegroup')
                         clend = len(cl)
                         changesets = clend - clstart
                         progress.complete()
                         self.callback = None
                         # pull off the manifest group
                         repo.ui.status(_("adding manifests\n"))
                         # We know that we'll never have more manifests than we had
                         # changesets.
                         progress = repo.ui.makeprogress(_('manifests'), unit=_('chunks'),
                                                         total=changesets)
                         self._unpackmanifests(repo, revmap, trp, progress)
                         # Maps filename -> set of file nodes that must be present once
                         # the file group has been applied; only filled in when the
                         # server.validate option is enabled.
                         needfiles = {}
                         if repo.ui.configbool('server', 'validate'):
                             cl = repo.changelog
                             ml = repo.manifestlog
                             # validate incoming csets have their manifests
                             for cset in pycompat.xrange(clstart, clend):
                                 mfnode = cl.changelogrevision(cset).manifest
                                 mfest = ml[mfnode].readdelta()
                                 # store file cgnodes we must see
                                 for f, n in mfest.iteritems():
                                     needfiles.setdefault(f, set()).add(n)
                         # process the files
                         repo.ui.status(_("adding file changes\n"))
                         newrevs, newfiles = _addchangegroupfiles(
                             repo, self, revmap, trp, efiles, needfiles)
                         revisions += newrevs
                         files += newfiles
                         # Net change in head count; new heads that close their branch
                         # are not counted as added heads.
                         deltaheads = 0
                         if oldheads:
                             heads = cl.heads()
                             deltaheads = len(heads) - len(oldheads)
                             for h in heads:
                                 if h not in oldheads and repo[h].closesbranch():
                                     deltaheads -= 1
                         htext = ""
                         if deltaheads:
                             htext = _(" (%+d heads)") % deltaheads
                         repo.ui.status(_("added %d changesets"
                                          " with %d changes to %d files%s\n")
                                          % (changesets, revisions, files, htext))
                         repo.invalidatevolatilesets()
                         if changesets > 0:
                             # Record the first/last added node on the transaction only
                             # if no 'node' is recorded yet; otherwise put them in a
                             # private copy of the hook arguments.
                             if 'node' not in tr.hookargs:
                                 tr.hookargs['node'] = hex(cl.node(clstart))
                                 tr.hookargs['node_last'] = hex(cl.node(clend - 1))
                                 hookargs = dict(tr.hookargs)
                             else:
                                 hookargs = dict(tr.hookargs)
                                 hookargs['node'] = hex(cl.node(clstart))
                                 hookargs['node_last'] = hex(cl.node(clend - 1))
                             repo.hook('pretxnchangegroup',
                                       throw=True, **pycompat.strkwargs(hookargs))
                         added = [cl.node(r) for r in pycompat.xrange(clstart, clend)]
                         phaseall = None
                         if srctype in ('push', 'serve'):
                             # Old servers can not push the boundary themselves.
                             # New servers won't push the boundary if changeset already
                             # exists locally as secret
                             #
                             # We should not use added here but the list of all change in
                             # the bundle
                             if repo.publishing():
                                 targetphase = phaseall = phases.public
                             else:
                                 # closer target phase computation
                                 # Those changesets have been pushed from the
                                 # outside, their phases are going to be pushed
                                 # alongside. Therefore `targetphase` is
                                 # ignored.
                                 targetphase = phaseall = phases.draft
                         if added:
                             phases.registernew(repo, tr, targetphase, added)
                         if phaseall is not None:
                             phases.advanceboundary(repo, tr, phaseall, cgnodes)
                         if changesets > 0:
                             def runhooks():
                                 # These hooks run when the lock releases, not when the
                                 # transaction closes. So it's possible for the changelog
                                 # to have changed since we last saw it.
                                 if clstart >= len(repo):
                                     return
                                 repo.hook("changegroup", **pycompat.strkwargs(hookargs))
                                 # One "incoming" hook call per added changeset, with
                                 # 'node' set to that changeset and no 'node_last'.
                                 for n in added:
                                     args = hookargs.copy()
                                     args['node'] = hex(n)
                                     del args['node_last']
                                     repo.hook("incoming", **pycompat.strkwargs(args))
                                 newheads = [h for h in repo.heads()
                                             if h not in oldheads]
                                 repo.ui.log("incoming",
                                             "%d incoming changes - new heads: %s\n",
                                             len(added),
                                             ', '.join([hex(c[:6]) for c in newheads]))
                             # Defer runhooks: on transaction close it is handed to
                             # repo._afterlock().
                             tr.addpostclose('changegroup-runhooks-%020i' % clstart,
                                             lambda tr: repo._afterlock(runhooks))
                     finally:
                         repo.ui.flush()
                     # never return 0 here:
                     # NOTE(review): the docstring lists 0 for "nothing changed", but
                     # this computation cannot produce 0 - confirm which is intended.
                     if deltaheads < 0:
                         ret = deltaheads - 1
                     else:
                         ret = deltaheads + 1
                     return ret
                 def deltaiter(self):
                     """
                     returns an iterator of the deltas in this changegroup

                     Useful for passing to the underlying storage system to be stored.
                     """
                     # ``chain`` is the node of the previously yielded delta (None for
                     # the first one); deltachunk() receives it as ``prevnode``.
                     chain = None
                     # Iteration stops when deltachunk() returns {} (empty chunk).
                     for chunkdata in iter(lambda: self.deltachunk(chain), {}):
                         # Chunkdata: (node, p1, p2, cs, deltabase, delta, flags)
                         yield chunkdata
                         chain = chunkdata[0]
             class cg2unpacker(cg1unpacker):
                 """Unpacker for cg2 streams.

                 cg2 streams add support for generaldelta, so the delta header
                 format is slightly different. All other features about the data
                 remain the same.
                 """
                 deltaheader = _CHANGEGROUPV2_DELTA_HEADER
                 deltaheadersize = _CHANGEGROUPV2_DELTA_HEADER.size
                 version = '02'
                 def _deltaheader(self, headertuple, prevnode):
                     """Expand an unpacked cg2 delta header to the common 6-tuple.

                     The header carries the delta base itself, so ``prevnode`` is not
                     consulted. Flags are always reported as 0.
                     """
                     node, p1, p2, deltabase, linknode = headertuple
                     return (node, p1, p2, deltabase, linknode, 0)
             class cg3unpacker(cg2unpacker):
                 """Unpacker for cg3 streams.

                 cg3 streams add support for exchanging treemanifests and revlog
                 flags. It adds the revlog flags to the delta header and an empty chunk
                 separating manifests and files.
                 """
                 deltaheader = _CHANGEGROUPV3_DELTA_HEADER
                 deltaheadersize = _CHANGEGROUPV3_DELTA_HEADER.size
                 version = '03'
                 _grouplistcount = 2 # One list of manifests and one list of files
                 def _deltaheader(self, headertuple, prevnode):
                     """Return the unpacked cg3 header, which already has all six fields."""
                     node, p1, p2, deltabase, linknode, flags = headertuple
                     return (node, p1, p2, deltabase, linknode, flags)
                 def _unpackmanifests(self, repo, revmap, trp, prog):
                     """Apply the root manifest group, then any directory manifest groups.

                     Raises error.Abort when a directory's revlog group turns out empty.
                     """
                     super(cg3unpacker, self)._unpackmanifests(repo, revmap, trp, prog)
                     while True:
                         header = self.filelogheader()
                         # An empty header marks the end of the directory list.
                         if header == {}:
                             break
                         # If we get here, there are directory manifests in the changegroup
                         dirname = header["filename"]
                         repo.ui.debug("adding %s revisions\n" % dirname)
                         dirlog = repo.manifestlog._revlog.dirlog(dirname)
                         if not dirlog.addgroup(self.deltaiter(), revmap, trp):
                             raise error.Abort(_("received dir revlog group is empty"))
             class headerlessfixup(object):
                 """File-like reader that serves the bytes in ``h`` before ``fh``.
                 ``h`` holds bytes that are handed out first; once they are exhausted
                 every read is delegated to ``readexactly`` on ``fh``.
                 """
                 def __init__(self, fh, h):
                     self._fh = fh
                     self._h = h
                 def read(self, n):
                     """Return ``n`` bytes, draining the buffered header first."""
                     if not self._h:
                         return readexactly(self._fh, n)
                     head = self._h[:n]
                     self._h = self._h[n:]
                     shortfall = n - len(head)
                     if shortfall > 0:
                         # The buffered header ran out mid-read: top up from the stream.
                         head += readexactly(self._fh, shortfall)
                     return head
             @attr.s(slots=True, frozen=True)
             class revisiondelta(object):
                 """Describes a delta entry in a changegroup.
                 Captured data is sufficient to serialize the delta into multiple
                 formats.
                 The class is declared with ``attr.s(slots=True, frozen=True)``, so
                 instances are slotted and their fields cannot be reassigned after
                 construction. Fields are declared in the order: node, p1node,
                 p2node, basenode, linknode, flags, deltachunks.
                 """
                 # 20 byte node of this revision.
                 node = attr.ib()
                 # 20 byte nodes of parent revisions.
                 p1node = attr.ib()
                 p2node = attr.ib()
                 # 20 byte node of node this delta is against.
                 basenode = attr.ib()
                 # 20 byte node of changeset revision this delta is associated with.
                 linknode = attr.ib()
                 # 2 bytes of flags to apply to revision data.
                 flags = attr.ib()
                 # Iterable of chunks holding raw delta data. Consumers iterate it
                 # more than once (to compute the total length, then to emit), so it
                 # must be re-iterable.
                 deltachunks = attr.ib()
+            def _sortnodesnormal(store, nodes, reorder):
+                """Sort nodes for changegroup generation and turn into revnums.
+                ``store`` must provide ``rev()`` and ``_generaldelta``; ``nodes`` is
+                an iterable of nodes of that store.
+                ``reorder`` is a tri-state: a true value always linearizes the DAG,
+                ``None`` linearizes only when the store uses generaldelta, and any
+                other false value yields the revisions in ascending revnum order.
+                Returns whatever ``dag.linearize()`` returns in the first two cases
+                and a sorted list of revision numbers otherwise.
+                """
+                # for generaldelta revlogs, we linearize the revs; this will both be
+                # much quicker and generate a much smaller bundle
+                if (store._generaldelta and reorder is None) or reorder:
+                    dag = dagutil.revlogdag(store)
+                    return dag.linearize(set(store.rev(n) for n in nodes))
+                else:
+                    return sorted([store.rev(n) for n in nodes])
+            def _sortnodesellipsis(store, nodes, clnodetorev, lookup):
+                """Sort nodes for changegroup generation and turn into revnums.
+                Used in ellipsis serving mode. ``lookup`` maps a node of ``store`` to
+                its changelog node and ``clnodetorev`` maps changelog nodes to
+                changelog revision numbers; nodes are ordered by that changelog
+                revision and returned as a list of ``store`` revision numbers.
+                A ``KeyError`` propagates if a looked-up changelog node is missing
+                from ``clnodetorev``.
+                """
+                # Ellipses serving mode.
+                #
+                # In a perfect world, we'd generate better ellipsis-ified graphs
+                # for non-changelog revlogs. In practice, we haven't started doing
+                # that yet, so the resulting DAGs for the manifestlog and filelogs
+                # are actually full of bogus parentage on all the ellipsis
+                # nodes. This has the side effect that, while the contents are
+                # correct, the individual DAGs might be completely out of whack in
+                # a case like 882681bc3166 and its ancestors (back about 10
+                # revisions or so) in the main hg repo.
+                #
+                # The one invariant we *know* holds is that the new (potentially
+                # bogus) DAG shape will be valid if we order the nodes in the
+                # order that they're introduced in dramatis personae by the
+                # changelog, so what we do is we sort the non-changelog histories
+                # by the order in which they are used by the changelog.
+                key = lambda n: clnodetorev[lookup(n)]
+                return [store.rev(n) for n in sorted(nodes, key=key)]
             class cgpacker(object):
                 def __init__(self, repo, filematcher, version, allowreorder,
                              deltaparentfn, builddeltaheader, manifestsend,
                              bundlecaps=None, ellipses=False,
                              shallow=False, ellipsisroots=None, fullnodes=None):
                     """Given a source repo, construct a bundler.
                     filematcher is a matcher that matches on files to include in the
                     changegroup. Used to facilitate sparse changegroups.
                     allowreorder controls whether reordering of revisions is allowed.
                     This value is used when ``bundle.reorder`` is ``auto`` or isn't
                     set.
                     deltaparentfn is a callable that resolves the delta parent for
                     a specific revision.
                     builddeltaheader is a callable that constructs the header for a group
                     delta.
                     manifestsend is a chunk to send after manifests have been fully emitted.
                     ellipses indicates whether ellipsis serving mode is enabled.
                     bundlecaps is optional and can be used to specify the set of
                     capabilities which can be used to build the bundle. While bundlecaps is
                     unused in core Mercurial, extensions rely on this feature to communicate
                     capabilities to customize the changegroup packer.
                     shallow indicates whether shallow data might be sent. The packer may
                     need to pack file contents not introduced by the changes being packed.
                     fullnodes is the list of nodes which should not be ellipsis nodes. We
                     store this rather than the set of nodes that should be ellipsis because
                     for very large histories we expect this to be significantly smaller.
                     """
                     assert filematcher
                     self._filematcher = filematcher
                     self.version = version
                     self._deltaparentfn = deltaparentfn
                     self._builddeltaheader = builddeltaheader
                     self._manifestsend = manifestsend
                     self._ellipses = ellipses
                     # Set of capabilities we can use to build the bundle.
                     if bundlecaps is None:
                         bundlecaps = set()
                     self._bundlecaps = bundlecaps
                     self._isshallow = shallow
                     self._fullnodes = fullnodes
                     # Maps ellipsis revs to their roots at the changelog level.
                     self._precomputedellipsis = ellipsisroots
                     # experimental config: bundle.reorder
                     reorder = repo.ui.config('bundle', 'reorder')
                     if reorder == 'auto':
                         self._reorder = allowreorder
                     else:
                         self._reorder = stringutil.parsebool(reorder)
                     self._repo = repo
                     if self._repo.ui.verbose and not self._repo.ui.debugflag:
                         self._verbosenote = self._repo.ui.note
                     else:
                         self._verbosenote = lambda s: None
                     # Maps CL revs to per-revlog revisions. Cleared in close() at
                     # the end of each group.
                     self._clrevtolocalrev = {}
                     self._nextclrevtolocalrev = {}
                     # Maps changelog nodes to changelog revs. Filled in once
                     # during changelog stage and then left unmodified.
                     self._clnodetorev = {}
                 def _close(self):
                     """Finish the current group and return the closing chunk.
                     Ellipses serving mode bookkeeping: the changelog-rev to local-rev
                     mapping is emptied and, if a mapping was staged for the next
                     group, that one becomes current and the staging slot is reset to
                     None.
                     """
                     self._clrevtolocalrev.clear()
                     staged = self._nextclrevtolocalrev
                     if staged is not None:
                         self._clrevtolocalrev = staged
                         self._nextclrevtolocalrev = None
                     return closechunk()
-                # Extracted both for clarity and for overriding in extensions.
+                def group(self, revs, store, ischangelog, lookup, units=None):
-                def _sortgroup(self, store, ischangelog, nodelist, lookup):
-                    """Sort nodes for change group and turn them into revnums."""
-                    # Ellipses serving mode.
-                    # In a perfect world, we'd generate better ellipsis-ified graphs
-                    # for non-changelog revlogs. In practice, we haven't started doing
-                    # that yet, so the resulting DAGs for the manifestlog and filelogs
-                    # are actually full of bogus parentage on all the ellipsis
-                    # nodes. This has the side effect that, while the contents are
-                    # correct, the individual DAGs might be completely out of whack in
-                    # a case like 882681bc3166 and its ancestors (back about 10
-                    # revisions or so) in the main hg repo.
-                    # The one invariant we *know* holds is that the new (potentially
-                    # bogus) DAG shape will be valid if we order the nodes in the
-                    # order that they're introduced in dramatis personae by the
-                    # changelog, so what we do is we sort the non-changelog histories
-                    # by the order in which they are used by the changelog.
-                    if self._ellipses and not ischangelog:
-                        key = lambda n: self._clnodetorev[lookup(n)]
-                        return [store.rev(n) for n in sorted(nodelist, key=key)]
-                    # for generaldelta revlogs, we linearize the revs; this will both be
-                    # much quicker and generate a much smaller bundle
-                    if (store._generaldelta and self._reorder is None) or self._reorder:
-                        dag = dagutil.revlogdag(store)
-                        return dag.linearize(set(store.rev(n) for n in nodelist))
-                    else:
-                        return sorted([store.rev(n) for n in nodelist])
-                def group(self, nodelist, store, ischangelog, lookup, units=None):
                     """Calculate a delta group, yielding a sequence of changegroup chunks
                     (strings).
                     Given a list of revision numbers of ``store`` (already in emission
                     order), yield the deltas and metadata for those revisions. The
                     first delta is first parent(revs[0]) -> revs[0], the receiver is
                     guaranteed to have this parent as it has all history before
                     these changesets. In the case firstparent is nullrev the
                     changegroup starts with a full revision.
                     ``lookup`` is called with each node of ``store`` and returns the
                     changelog node it is linked to. ``ischangelog`` is forwarded to
                     the per-revision chunk builder.
                     If units is not None, progress detail will be generated, units specifies
                     the type of revlog that is touched (changelog, manifest, etc.).
                     The stream always ends with the closing chunk, including when
                     there is nothing to send.
                     """
                     # if we don't have any revisions touched by these changesets, bail
-                    if len(nodelist) == 0:
+                    if len(revs) == 0:
                         yield self._close()
                         return
-                    revs = self._sortgroup(store, ischangelog, nodelist, lookup)
                     # add the parent of the first rev
                     # NOTE(review): with ``revs`` supplied by the caller, the insert
                     # below modifies the caller's list in place and requires it to
                     # support ``insert``.
                     p = store.parentrevs(revs[0])[0]
                     revs.insert(0, p)
                     # build deltas
                     progress = None
                     if units is not None:
                         progress = self._repo.ui.makeprogress(_('bundling'), unit=units,
                                                               total=(len(revs) - 1))
                     # Walk consecutive (prev, curr) pairs; revs[0] is only ever used
                     # as the "previous" revision of the first real entry.
                     for r in pycompat.xrange(len(revs) - 1):
                         if progress:
                             progress.update(r + 1)
                         prev, curr = revs[r], revs[r + 1]
                         linknode = lookup(store.node(curr))
                         for c in self._revchunk(store, ischangelog, curr, prev, linknode):
                             yield c
                     if progress:
                         progress.complete()
                     yield self._close()
                 # filter any nodes that claim to be part of the known set
                 def _prune(self, store, missing, commonrevs):
                     """Return the nodes of ``missing`` whose linkrev is not common.
                     For a manifest revlog whose directory is not visited by the file
                     matcher, nothing is kept and an empty list is returned.
                     """
                     # TODO this violates storage abstraction for manifests.
                     if isinstance(store, manifest.manifestrevlog):
                         # store._dir has its last character dropped before matching;
                         # an empty result stands for the root, spelled '.'.
                         visited = self._filematcher.visitdir(store._dir[:-1] or '.')
                         if not visited:
                             return []
                     torev = store.rev
                     tolinkrev = store.linkrev
                     kept = []
                     for node in missing:
                         if tolinkrev(torev(node)) not in commonrevs:
                             kept.append(node)
                     return kept
-                def _packmanifests(self, dir, mfnodes, lookuplinknode):
+                def _packmanifests(self, dir, dirlog, revs, lookuplinknode):
                     """Pack manifests into a changegroup stream.
                     Encodes the directory name in the output so multiple manifests
                     can be sent. Multiple manifests is not supported by cg1 and cg2.
                     ``dir`` is the directory the manifests belong to; when it is
                     non-empty a file header for it is emitted first and the packer
                     version must be '03'. ``dirlog`` is the store holding the
                     revisions, ``revs`` the revision numbers to send and
                     ``lookuplinknode`` the linknode lookup handed to group().
                     """
                     if dir:
                         assert self.version == b'03'
                         yield _fileheader(dir)
-                    # TODO violates storage abstractions by assuming revlogs.
+                    for chunk in self.group(revs, dirlog, False, lookuplinknode,
-                    dirlog = self._repo.manifestlog._revlog.dirlog(dir)
-                    for chunk in self.group(mfnodes, dirlog, False, lookuplinknode,
                                             units=_('manifests')):
                         yield chunk
                 def generate(self, commonrevs, clnodes, fastpathlinkrev, source):
                     """Yield a sequence of changegroup byte chunks.
                     Chunks are produced in this order: changelog, manifests, files,
                     then a final closing chunk.
                     commonrevs is forwarded to the manifest and file generators.
                     clnodes are the changelog nodes to bundle.
                     fastpathlinkrev requests the linkrev fast path; it is turned off
                     below when reordering is enabled or when the repository has the
                     'treemanifest' requirement.
                     source is forwarded to the manifest/file generators and to the
                     'outgoing' hook, which fires after the last chunk when clnodes is
                     not empty.
                     """
                     repo = self._repo
                     cl = repo.changelog
                     self._verbosenote(_('uncompressed size of bundle content:\n'))
                     size = 0
                     # clstate is only fully populated once ``chunks`` has been
                     # consumed, so it must not be read before the loop below ends.
                     clstate, chunks = self._generatechangelog(cl, clnodes)
                     for chunk in chunks:
                         size += len(chunk)
                         yield chunk
                     self._verbosenote(_('%8.i (changelog)\n') % size)
                     clrevorder = clstate['clrevorder']
                     mfs = clstate['mfs']
                     changedfiles = clstate['changedfiles']
                     # We need to make sure that the linkrev in the changegroup refers to
                     # the first changeset that introduced the manifest or file revision.
                     # The fastpath is usually safer than the slowpath, because the filelogs
                     # are walked in revlog order.
                     #
                     # When taking the slowpath with reorder=None and the manifest revlog
                     # uses generaldelta, the manifest may be walked in the "wrong" order.
                     # Without 'clrevorder', we would get an incorrect linkrev (see fix in
                     # cc0ff93d0c0c).
                     #
                     # When taking the fastpath, we are only vulnerable to reordering
                     # of the changelog itself. The changelog never uses generaldelta, so
                     # it is only reordered when reorder=True. To handle this case, we
                     # simply take the slowpath, which already has the 'clrevorder' logic.
                     # This was also fixed in cc0ff93d0c0c.
                     fastpathlinkrev = fastpathlinkrev and not self._reorder
                     # Treemanifests don't work correctly with fastpathlinkrev
                     # either, because we don't discover which directory nodes to
                     # send along with files. This could probably be fixed.
                     fastpathlinkrev = fastpathlinkrev and (
                         'treemanifest' not in repo.requirements)
                     fnodes = {}  # needed file nodes
                     for chunk in self.generatemanifests(commonrevs, clrevorder,
                             fastpathlinkrev, mfs, fnodes, source):
                         yield chunk
                     if self._ellipses:
                         mfdicts = None
                         if self._isshallow:
                             # Read the manifests now: mfs is emptied right below.
                             mfdicts = [(self._repo.manifestlog[n].read(), lr)
                                        for (n, lr) in mfs.iteritems()]
                     mfs.clear()
                     clrevs = set(cl.rev(x) for x in clnodes)
                     if not fastpathlinkrev:
                         # Slow path: use the file node -> changelog node mapping
                         # collected into fnodes while manifests were generated.
                         def linknodes(unused, fname):
                             return fnodes.get(fname, {})
                     else:
                         cln = cl.node
                         # Fast path: derive the mapping from the filelog's own
                         # linkrevs, keeping only revisions linked to a bundled
                         # changeset.
                         def linknodes(filerevlog, fname):
                             llr = filerevlog.linkrev
                             fln = filerevlog.node
                             revs = ((r, llr(r)) for r in filerevlog)
                             return dict((fln(r), cln(lr)) for r, lr in revs if lr in clrevs)
                     if self._ellipses:
                         # We need to pass the mfdicts variable down into
                         # generatefiles(), but more than one command might have
                         # wrapped generatefiles so we can't modify the function
                         # signature. Instead, we pass the data to ourselves using an
                         # instance attribute. I'm sorry.
                         self._mfdicts = mfdicts
                     for chunk in self.generatefiles(changedfiles, linknodes, commonrevs,
                                                     source):
                         yield chunk
                     yield self._close()
                     if clnodes:
                         repo.hook('outgoing', node=hex(clnodes[0]), source=source)
                 def _generatechangelog(self, cl, nodes):
                     """Generate data for changelog chunks.
                     Returns a 2-tuple of a dict containing state and an iterable of
                     byte chunks. The state will not be fully populated until the
                     chunk stream has been fully consumed.
                     The state dict has three keys: 'clrevorder' (changelog node ->
                     position in emission order), 'mfs' (manifest node -> first
                     changelog node seen using it) and 'changedfiles' (set of file
                     names collected from the changesets).
                     """
                     clrevorder = {}
                     mfs = {} # needed manifests
                     mfl = self._repo.manifestlog
                     # TODO violates storage abstraction.
                     mfrevlog = mfl._revlog
                     changedfiles = set()
                     # Callback for the changelog, used to collect changed files and
                     # manifest nodes.
                     # Returns the linkrev node (identity in the changelog case).
                     def lookupcl(x):
                         c = cl.read(x)
                         # Record the order in which changesets are emitted.
                         clrevorder[x] = len(clrevorder)
                         if self._ellipses:
                             # Only update mfs if x is going to be sent. Otherwise we
                             # end up with bogus linkrevs specified for manifests and
                             # we skip some manifest nodes that we should otherwise
                             # have sent.
                             if (x in self._fullnodes
                                 or cl.rev(x) in self._precomputedellipsis):
                                 n = c[0]
                                 # Record the first changeset introducing this manifest
                                 # version.
                                 mfs.setdefault(n, x)
                                 # Set this narrow-specific dict so we have the lowest
                                 # manifest revnum to look up for this cl revnum. (Part of
                                 # mapping changelog ellipsis parents to manifest ellipsis
                                 # parents)
                                 self._nextclrevtolocalrev.setdefault(cl.rev(x),
                                                                      mfrevlog.rev(n))
                             # We can't trust the changed files list in the changeset if the
                             # client requested a shallow clone.
                             if self._isshallow:
                                 changedfiles.update(mfl[c[0]].read().keys())
                             else:
                                 changedfiles.update(c[3])
                         else:
                             n = c[0]
                             # record the first changeset introducing this manifest version
                             mfs.setdefault(n, x)
                             # Record a complete list of potentially-changed files in
                             # this manifest.
                             changedfiles.update(c[3])
                         return x
+                    # Changelog doesn't benefit from reordering revisions. So send out
+                    # revisions in store order.
+                    revs = sorted(cl.rev(n) for n in nodes)
                     # The containers below are shared with lookupcl(), which fills
                     # them as a side effect while ``gen`` is being consumed.
                     state = {
                         'clrevorder': clrevorder,
                         'mfs': mfs,
                         'changedfiles': changedfiles,
                     }
-                    gen = self.group(nodes, cl, True, lookupcl, units=_('changesets'))
+                    gen = self.group(revs, cl, True, lookupcl, units=_('changesets'))
                     return state, gen
                 def generatemanifests(self, commonrevs, clrevorder, fastpathlinkrev, mfs,
                                       fnodes, source):
                     """Returns an iterator of changegroup chunks containing manifests.
                     `mfs` maps root manifest nodes to changelog nodes. `fnodes` is
                     filled in as a side effect (file name -> {file node: changelog
                     node}) when `fastpathlinkrev` is false. `clrevorder` is used to
                     keep the earliest changelog node for each entry.
                     The last chunk yielded is always the manifests-end chunk.
                     `source` is unused here, but is used by extensions like remotefilelog to
                     change what is sent based on pulls vs pushes, etc.
                     """
                     repo = self._repo
                     mfl = repo.manifestlog
                     dirlog = mfl._revlog.dirlog
                     # Work list: directory -> {manifest node: changelog node}. The
                     # root directory is spelled ''; subdirectories are added by
                     # lookupmflinknode() while their parent manifest is being sent.
                     tmfnodes = {'': mfs}
                     # Callback for the manifest, used to collect linkrevs for filelog
                     # revisions.
                     # Returns the linkrev node (collected in lookupcl).
                     def makelookupmflinknode(dir, nodes):
                         if fastpathlinkrev:
                             assert not dir
                             return mfs.__getitem__
                         def lookupmflinknode(x):
                             """Callback for looking up the linknode for manifests.
                             Returns the linkrev node for the specified manifest.
                             SIDE EFFECT:
                             1) fclnodes gets populated with the list of relevant
                                file nodes if we're not using fastpathlinkrev
                             2) When treemanifests are in use, collects treemanifest nodes
                                to send
                             Note that this means manifests must be completely sent to
                             the client before you can trust the list of files and
                             treemanifests to send.
                             """
                             clnode = nodes[x]
                             mdata = mfl.get(dir, x).readfast(shallow=True)
                             for p, n, fl in mdata.iterentries():
                                 if fl == 't': # subdirectory manifest
                                     subdir = dir + p + '/'
                                     tmfclnodes = tmfnodes.setdefault(subdir, {})
                                     tmfclnode = tmfclnodes.setdefault(n, clnode)
                                     # Keep whichever changeset comes first in
                                     # emission order.
                                     if clrevorder[clnode] < clrevorder[tmfclnode]:
                                         tmfclnodes[n] = clnode
                                 else:
                                     f = dir + p
                                     fclnodes = fnodes.setdefault(f, {})
                                     fclnode = fclnodes.setdefault(n, clnode)
                                     if clrevorder[clnode] < clrevorder[fclnode]:
                                         fclnodes[n] = clnode
                             return clnode
                         return lookupmflinknode
                     size = 0
                     while tmfnodes:
                         dir, nodes = tmfnodes.popitem()
-                        prunednodes = self._prune(dirlog(dir), nodes, commonrevs)
+                        store = dirlog(dir)
+                        prunednodes = self._prune(store, nodes, commonrevs)
                         # The root manifest group is always emitted, even when
                         # empty; directory groups only when something is left.
                         if not dir or prunednodes:
-                            for x in self._packmanifests(dir, prunednodes,
+                            lookupfn = makelookupmflinknode(dir, nodes)
-                                                         makelookupmflinknode(dir, nodes)):
+                            if self._ellipses:
+                                revs = _sortnodesellipsis(store, prunednodes,
+                                                          self._clnodetorev, lookupfn)
+                            else:
+                                revs = _sortnodesnormal(store, prunednodes,
+                                                        self._reorder)
+                            for x in self._packmanifests(dir, store, revs, lookupfn):
                                 size += len(x)
                                 yield x
                     self._verbosenote(_('%8.i (manifests)\n') % size)
                     yield self._manifestsend
                 # The 'source' parameter is useful for extensions
                 def generatefiles(self, changedfiles, linknodes, commonrevs, source):
                     changedfiles = list(filter(self._filematcher, changedfiles))
                     if self._isshallow:
                         # See comment in generate() for why this sadness is a thing.
                         mfdicts = self._mfdicts
                         del self._mfdicts
                         # In a shallow clone, the linknodes callback needs to also include
                         # those file nodes that are in the manifests we sent but weren't
                         # introduced by those manifests.
                         commonctxs = [self._repo[c] for c in commonrevs]
                         oldlinknodes = linknodes
                         clrev = self._repo.changelog.rev
                         # Defining this function has a side-effect of overriding the
                         # function of the same name that was passed in as an argument.
                         # TODO have caller pass in appropriate function.
                         def linknodes(flog, fname):
                             for c in commonctxs:
                                 try:
                                     fnode = c.filenode(fname)
                                     self._clrevtolocalrev[c.rev()] = flog.rev(fnode)
                                 except error.ManifestLookupError:
                                     pass
                             links = oldlinknodes(flog, fname)
                             if len(links) != len(mfdicts):
                                 for mf, lr in mfdicts:
                                     fnode = mf.get(fname, None)
                                     if fnode in links:
                                         links[fnode] = min(links[fnode], lr, key=clrev)
                                     elif fnode:
                                         links[fnode] = lr
                             return links
                     return self._generatefiles(changedfiles, linknodes, commonrevs, source)
                 def _generatefiles(self, changedfiles, linknodes, commonrevs, source):
                     """Yield the changegroup chunks for every file with data to send.
                     Files are processed in sorted name order. For each file,
                     ``linknodes(filelog, fname)`` supplies the {file node: changelog
                     node} mapping; nodes whose linkrev is in ``commonrevs`` are
                     pruned, and files left with no node are skipped entirely. A file
                     header chunk precedes the delta group of each emitted file.
                     Raises error.Abort when ``repo.file(fname)`` is falsy.
                     ``source`` is not used in this method.
                     """
                     repo = self._repo
                     progress = repo.ui.makeprogress(_('bundling'), unit=_('files'),
                                                     total=len(changedfiles))
                     for i, fname in enumerate(sorted(changedfiles)):
                         filerevlog = repo.file(fname)
                         if not filerevlog:
                             raise error.Abort(_("empty or missing file data for %s") %
                                               fname)
                         linkrevnodes = linknodes(filerevlog, fname)
                         # Lookup for filenodes, we collected the linkrev nodes above in the
                         # fastpath case and with lookupmf in the slowpath case.
                         def lookupfilelog(x):
                             return linkrevnodes[x]
                         filenodes = self._prune(filerevlog, linkrevnodes, commonrevs)
                         if filenodes:
+                            if self._ellipses:
+                                revs = _sortnodesellipsis(filerevlog, filenodes,
+                                                          self._clnodetorev, lookupfilelog)
+                            else:
+                                revs = _sortnodesnormal(filerevlog, filenodes,
+                                                        self._reorder)
                             progress.update(i + 1, item=fname)
                             h = _fileheader(fname)
                             # size counts the header plus every chunk of this file.
                             size = len(h)
                             yield h
-                            for chunk in self.group(filenodes, filerevlog, False,
+                            for chunk in self.group(revs, filerevlog, False, lookupfilelog):
-                                                    lookupfilelog):
                                 size += len(chunk)
                                 yield chunk
                             self._verbosenote(_('%8.i  %s\n') % (size, fname))
                     progress.complete()
                 def _revchunk(self, store, ischangelog, rev, prev, linknode):
                     if self._ellipses:
                         fn = self._revisiondeltanarrow
                     else:
                         fn = self._revisiondeltanormal
                     delta = fn(store, ischangelog, rev, prev, linknode)
                     if not delta:
                         return
                     meta = self._builddeltaheader(delta)
                     l = len(meta) + sum(len(x) for x in delta.deltachunks)
                     yield chunkheader(l)
                     yield meta
                     for x in delta.deltachunks:
                         yield x
                 def _revisiondeltanormal(self, store, ischangelog, rev, prev, linknode):
                     """Build the revisiondelta describing ``rev`` of ``store``.
                     The delta base is chosen by the configured delta parent function.
                     The payload is the full raw text when the base is nullrev or when
                     the base or the revision is censored (the tombstone is used if
                     reading raises CensoredNodeError); in those cases a diff header is
                     prepended. Otherwise the payload is the store's diff between the
                     base and ``rev`` with an empty prefix. ``ischangelog`` is not used
                     here.
                     """
                     node = store.node(rev)
                     p1rev, p2rev = store.parentrevs(rev)
                     baserev = self._deltaparentfn(store, rev, p1rev, p2rev, prev)
                     header = ''
                     if store.iscensored(baserev) or store.iscensored(rev):
                         try:
                             payload = store.revision(node, raw=True)
                         except error.CensoredNodeError as exc:
                             payload = exc.tombstone
                         if baserev != nullrev:
                             baselen = store.rawsize(baserev)
                             header = mdiff.replacediffheader(baselen, len(payload))
                         else:
                             header = mdiff.trivialdiffheader(len(payload))
                     elif baserev == nullrev:
                         payload = store.revision(node, raw=True)
                         header = mdiff.trivialdiffheader(len(payload))
                     else:
                         payload = store.revdiff(baserev, rev)
                     p1node, p2node = store.parents(node)
                     basenode = store.node(baserev)
                     flags = store.flags(rev)
                     return revisiondelta(
                         node=node,
                         p1node=p1node,
                         p2node=p2node,
                         basenode=basenode,
                         linknode=linknode,
                         flags=flags,
                         deltachunks=(header, payload),
                     )
                 def _revisiondeltanarrow(self, store, ischangelog, rev, prev, linknode):
                     """Build the ``revisiondelta`` for ``rev`` when ellipsis nodes are in use.

                     Three outcomes are possible:

                     * ``linknode`` is in ``self._fullnodes``: the work is delegated to
                       ``_revisiondeltanormal`` and its result is returned unchanged.
                     * the link revision is not in ``self._precomputedellipsis``:
                       ``None`` is returned, meaning the revision is skipped.
                     * otherwise an ellipsis entry is returned: parents are rewritten
                       from ``self._precomputedellipsis``, ``REVIDX_ELLIPSIS`` is added to
                       the flags and the full revision text is sent against ``nullid``.

                     As a side effect ``self._clnodetorev`` and ``self._clrevtolocalrev``
                     are updated on every call. Raises ``error.Abort`` if a parent of an
                     ellipsis node cannot be resolved to a revision of ``store``.
                     """
                     # build up some mapping information that's useful later. See
                     # the local() nested function below.
                     if ischangelog:
                         self._clnodetorev[linknode] = rev
                         linkrev = rev
                         self._clrevtolocalrev[linkrev] = rev
                     else:
                         # Non-changelog stores rely on the mapping recorded while the
                         # changelog was processed (KeyError otherwise).
                         linkrev = self._clnodetorev[linknode]
                         self._clrevtolocalrev[linkrev] = rev
                     # This is a node to send in full, because the changeset it
                     # corresponds to was a full changeset.
                     if linknode in self._fullnodes:
                         return self._revisiondeltanormal(store, ischangelog, rev, prev,
                                                          linknode)
                     # At this point, a node can either be one we should skip or an
                     # ellipsis. If it's not an ellipsis, bail immediately.
                     if linkrev not in self._precomputedellipsis:
                         return
                     # Changelog revnums that act as parents of this ellipsis node.
                     linkparents = self._precomputedellipsis[linkrev]
                     def local(clrev):
                         """Turn a changelog revnum into a local revnum.
                         The ellipsis dag is stored as revnums on the changelog,
                         but when we're producing ellipsis entries for
                         non-changelog revlogs, we need to turn those numbers into
                         something local. This does that for us, and during the
                         changelog sending phase will also expand the stored
                         mappings as needed.
                         """
                         if clrev == nullrev:
                             return nullrev
                         if ischangelog:
                             # If we're doing the changelog, it's possible that we
                             # have a parent that is already on the client, and we
                             # need to store some extra mapping information so that
                             # our contained ellipsis nodes will be able to resolve
                             # their parents.
                             if clrev not in self._clrevtolocalrev:
                                 clnode = store.node(clrev)
                                 self._clnodetorev[clnode] = clrev
                             return clrev
                         # Walk the ellipsis-ized changelog breadth-first looking for a
                         # change that has been linked from the current revlog.
                         #
                         # For a flat manifest revlog only a single step should be necessary
                         # as all relevant changelog entries are relevant to the flat
                         # manifest.
                         #
                         # For a filelog or tree manifest dirlog however not every changelog
                         # entry will have been relevant, so we need to skip some changelog
                         # nodes even after ellipsis-izing.
                         walk = [clrev]
                         while walk:
                             # Pop from the front so the list behaves as a FIFO queue.
                             p = walk[0]
                             walk = walk[1:]
                             if p in self._clrevtolocalrev:
                                 return self._clrevtolocalrev[p]
                             # NOTE(review): ``p`` is a changelog revnum here, while the
                             # membership test near the top of this method checks
                             # ``linknode`` against the same container - confirm what
                             # ``self._fullnodes`` is expected to hold.
                             elif p in self._fullnodes:
                                 walk.extend([pp for pp in self._repo.changelog.parentrevs(p)
                                                 if pp != nullrev])
                             elif p in self._precomputedellipsis:
                                 walk.extend([pp for pp in self._precomputedellipsis[p]
                                                 if pp != nullrev])
                             else:
                                 # In this case, we've got an ellipsis with parents
                                 # outside the current bundle (likely an
                                 # incremental pull). We "know" that we can use the
                                 # value of this same revlog at whatever revision
                                 # is pointed to by linknode. "Know" is in scare
                                 # quotes because I haven't done enough examination
                                 # of edge cases to convince myself this is really
                                 # a fact - it works for all the (admittedly
                                 # thorough) cases in our testsuite, but I would be
                                 # somewhat unsurprised to find a case in the wild
                                 # where this breaks down a bit. That said, I don't
                                 # know if it would hurt anything.
                                 # NOTE(review): the range stops before 0, so revision 0
                                 # of ``store`` is never considered - confirm intended.
                                 for i in pycompat.xrange(rev, 0, -1):
                                     if store.linkrev(i) == clrev:
                                         return i
                                 # We failed to resolve a parent for this node, so
                                 # we crash the changegroup construction.
                                 raise error.Abort(
                                     'unable to resolve parent while packing %r %r'
                                     ' for changeset %r' % (store.indexfile, rev, clrev))
                         # Queue exhausted without finding a linked revision.
                         return nullrev
                     # Root revisions (no ellipsis parents, or no parents in the store)
                     # keep null parents; otherwise map each changelog parent to a
                     # local revnum and order them.
                     if not linkparents or (
                         store.parentrevs(rev) == (nullrev, nullrev)):
                         p1, p2 = nullrev, nullrev
                     elif len(linkparents) == 1:
                         p1, = sorted(local(p) for p in linkparents)
                         p2 = nullrev
                     else:
                         p1, p2 = sorted(local(p) for p in linkparents)
                     n = store.node(rev)
                     p1n, p2n = store.node(p1), store.node(p2)
                     flags = store.flags(rev)
                     # Mark the entry as an ellipsis node for the receiver.
                     flags |= revlog.REVIDX_ELLIPSIS
                     # TODO: try and actually send deltas for ellipsis data blocks
                     data = store.revision(n)
                     diffheader = mdiff.trivialdiffheader(len(data))
                     return revisiondelta(
                         node=n,
                         p1node=p1n,
                         p2node=p2n,
                         basenode=nullid,
                         linknode=linknode,
                         flags=flags,
                         deltachunks=(diffheader, data),
                     )
             def _deltaparentprev(store, rev, p1, p2, prev):
                 """Delta base policy that always picks the previously sent revision.

                 This is the policy for version 1 changegroups, which don't support
                 generaldelta. ``store``, ``rev``, ``p1`` and ``p2`` are accepted only
                 so the signature matches the other delta parent resolvers.
                 """
                 base = prev
                 return base
             def _deltaparentgeneraldelta(store, rev, p1, p2, prev):
                 """Resolve a delta parent when general deltas are supported.

                 ``store`` must provide ``deltaparent()``, ``storedeltachains`` and
                 ``candelta()``. ``p1``/``p2`` are the parent revisions of ``rev`` and
                 ``prev`` is the revision emitted just before it.

                 Returns the revision number to delta against, or ``nullrev`` when a
                 full snapshot must be sent. Whatever base is picked, it is only used
                 if ``store.candelta(base, rev)`` allows it.
                 """
                 dp = store.deltaparent(rev)
                 if dp == nullrev and store.storedeltachains:
                     # Avoid sending full revisions when delta parent is null. Pick prev
                     # in that case. It's tempting to pick p1 in this case, as p1 will
                     # be smaller in the common case. However, computing a delta against
                     # p1 may require resolving the raw text of p1, which could be
                     # expensive. The revlog caches should have prev cached, meaning
                     # less CPU for changegroup generation. There is likely room to add
                     # a flag and/or config option to control this behavior.
                     base = prev
                 elif dp == nullrev:
                     # revlog is configured to use full snapshot for a reason,
                     # stick to full snapshot.
                     base = nullrev
                 elif dp not in (p1, p2, prev):
                     # Pick prev when we can't be sure remote has the base revision.
                     # Do not return early: prev must pass the candelta() check below
                     # like every other candidate base.
                     base = prev
                 else:
                     base = dp
                 # Fall back to a full snapshot when the store refuses to delta
                 # between the chosen base and this revision.
                 if base != nullrev and not store.candelta(base, rev):
                     base = nullrev
                 return base
             def _deltaparentellipses(store, rev, p1, p2, prev):
                 """Delta base policy for ellipses mode: always delta against ``p1``.

                 TODO: send better deltas when in narrow mode.

                 changegroup.group() loops over revisions to send, including
                 revisions we'll skip. What this means is that ``prev`` will be a
                 potentially useless delta base for all ellipsis nodes, as the client
                 likely won't have it. In the future we should do bookkeeping about
                 which nodes have been sent to the client, and try to be
                 significantly smarter about delta bases. This is slightly tricky
                 because this same code has to work for all revlogs, and we don't
                 have the linkrev/linknode here.
                 """
                 base = p1
                 return base
             def _makecg1packer(repo, filematcher, bundlecaps, ellipses=False,
                                shallow=False, ellipsisroots=None, fullnodes=None):
                 """Create a ``cgpacker`` that emits version ``01`` changegroups.

                 The version 1 delta header carries node, p1, p2 and linknode only,
                 and the delta base is always the previously emitted revision.
                 """
                 def builddeltaheader(d):
                     # Pack the four 20-byte fields of the cg1 delta header.
                     return _CHANGEGROUPV1_DELTA_HEADER.pack(
                         d.node, d.p1node, d.p2node, d.linknode)

                 return cgpacker(
                     repo, filematcher, b'01',
                     deltaparentfn=_deltaparentprev,
                     allowreorder=None,
                     builddeltaheader=builddeltaheader,
                     manifestsend=b'',
                     bundlecaps=bundlecaps,
                     ellipses=ellipses,
                     shallow=shallow,
                     ellipsisroots=ellipsisroots,
                     fullnodes=fullnodes)
             def _makecg2packer(repo, filematcher, bundlecaps, ellipses=False,
                                shallow=False, ellipsisroots=None, fullnodes=None):
                 """Create a ``cgpacker`` that emits version ``02`` changegroups.

                 Compared to version 1 the delta header also carries the delta base
                 node, and the base is resolved with ``_deltaparentgeneraldelta``.
                 """
                 def builddeltaheader(d):
                     # Pack the five 20-byte fields of the cg2 delta header.
                     return _CHANGEGROUPV2_DELTA_HEADER.pack(
                         d.node, d.p1node, d.p2node, d.basenode, d.linknode)

                 # Since generaldelta is directly supported by cg2, reordering
                 # generally doesn't help, so we disable it by default (treating
                 # bundle.reorder=auto just like bundle.reorder=False).
                 return cgpacker(
                     repo, filematcher, b'02',
                     deltaparentfn=_deltaparentgeneraldelta,
                     allowreorder=False,
                     builddeltaheader=builddeltaheader,
                     manifestsend=b'',
                     bundlecaps=bundlecaps,
                     ellipses=ellipses,
                     shallow=shallow,
                     ellipsisroots=ellipsisroots,
                     fullnodes=fullnodes)
             def _makecg3packer(repo, filematcher, bundlecaps, ellipses=False,
                                shallow=False, ellipsisroots=None, fullnodes=None):
                 """Create a ``cgpacker`` that emits version ``03`` changegroups.

                 The version 3 delta header adds the revision flags to the version 2
                 fields. In ellipses mode the delta base is resolved with
                 ``_deltaparentellipses``, otherwise with ``_deltaparentgeneraldelta``.
                 """
                 def builddeltaheader(d):
                     # Pack the five node fields plus the flags of the cg3 header.
                     return _CHANGEGROUPV3_DELTA_HEADER.pack(
                         d.node, d.p1node, d.p2node, d.basenode, d.linknode, d.flags)

                 if ellipses:
                     deltaparentfn = _deltaparentellipses
                 else:
                     deltaparentfn = _deltaparentgeneraldelta

                 return cgpacker(
                     repo, filematcher, b'03',
                     deltaparentfn=deltaparentfn,
                     allowreorder=False,
                     builddeltaheader=builddeltaheader,
                     manifestsend=closechunk(),
                     bundlecaps=bundlecaps,
                     ellipses=ellipses,
                     shallow=shallow,
                     ellipsisroots=ellipsisroots,
                     fullnodes=fullnodes)
             # Maps a changegroup version string to a (packer factory, unpacker) pair.
             _packermap = {
                 '01': (_makecg1packer, cg1unpacker),
                 # cg2 adds support for exchanging generaldelta
                 '02': (_makecg2packer, cg2unpacker),
                 # cg3 adds support for exchanging revlog flags and treemanifests
                 '03': (_makecg3packer, cg3unpacker),
             }
             def allsupportedversions(repo):
                 """Return the set of changegroup versions usable with ``repo``.

                 Every version in ``_packermap`` is included, except that ``'03'`` is
                 dropped unless it is enabled through ``experimental.changegroup3``,
                 ``experimental.treemanifest`` or a ``treemanifest`` requirement.
                 """
                 ui = repo.ui
                 supported = set(_packermap.keys())
                 cg3enabled = (
                     ui.configbool('experimental', 'changegroup3')
                     or ui.configbool('experimental', 'treemanifest')
                     or 'treemanifest' in repo.requirements)
                 if not cg3enabled:
                     supported.discard('03')
                 return supported
             def supportedincomingversions(repo):
                 """Return the changegroup versions that can be applied to the repo."""
                 incoming = allsupportedversions(repo)
                 return incoming
             def supportedoutgoingversions(repo):
                 """Return the changegroup versions that can be created from the repo.

                 Versions 01 and 02 are removed from the supported set when the
                 repository has any of these requirements:

                 * ``treemanifest``: versions 01 and 02 support only flat manifests
                   and it's just too expensive to convert between the flat manifest
                   and tree manifest on the fly. Since tree manifests are hashed
                   differently, all of history would have to be converted. Instead,
                   we simply don't even pretend to support versions 01 and 02.
                 * narrow: versions 01 and 02 don't support revlog flags, and we need
                   to support that for stripping and unbundling to work.
                 * lfs: versions 01 and 02 don't support revlog flags, and we need to
                   mark LFS entries with REVIDX_EXTSTORED.
                 """
                 versions = allsupportedversions(repo)
                 requirements = repo.requirements
                 needscg3 = (
                     'treemanifest' in requirements
                     or repository.NARROW_REQUIREMENT in requirements
                     or LFS_REQUIREMENT in requirements)
                 if needscg3:
                     for legacy in ('01', '02'):
                         versions.discard(legacy)
                 return versions
             def localversion(repo):
                 """Return the best changegroup version for bundles used locally.

                 This covers bundles such as those from strip and shelve, and
                 temporary bundles: the highest supported outgoing version is picked.
                 """
                 outgoing = supportedoutgoingversions(repo)
                 return max(outgoing)
             def safeversion(repo):
                 """Return the smallest version it's safe to assume clients support.

                 For example, all hg versions that support generaldelta also support
                 changegroup 02, so 01 is ruled out for generaldelta repositories.
                 """
                 candidates = supportedoutgoingversions(repo)
                 if 'generaldelta' in repo.requirements:
                     candidates.discard('01')
                 assert candidates
                 return min(candidates)
             def getbundler(version, repo, bundlecaps=None, filematcher=None,
                            ellipses=False, shallow=False, ellipsisroots=None,
                            fullnodes=None):
                 """Return a packer able to produce ``version`` changegroups for ``repo``.

                 ``version`` must be one of ``supportedoutgoingversions(repo)``. When
                 ``filematcher`` is omitted an always-matcher is used; in every case
                 the matcher is intersected with ``repo.narrowmatch()``.

                 Raises ``error.ProgrammingError`` if a non-trivial matcher is used
                 with version 01, and ``error.Abort`` if ellipses are requested with
                 version 01 or 02.
                 """
                 assert version in supportedoutgoingversions(repo)

                 if filematcher is None:
                     filematcher = matchmod.alwaysmatcher(repo.root, '')

                 if version == '01' and not filematcher.always():
                     raise error.ProgrammingError('version 01 changegroups do not support '
                                                  'sparse file matchers')

                 if ellipses and version in (b'01', b'02'):
                     raise error.Abort(
                         _('ellipsis nodes require at least cg3 on client and server, '
                           'but negotiated version %s') % version)

                 # Requested files could include files not in the local store. So
                 # filter those out.
                 narrowed = matchmod.intersectmatchers(repo.narrowmatch(), filematcher)

                 makepacker = _packermap[version][0]
                 return makepacker(repo, narrowed, bundlecaps, ellipses=ellipses,
                                   shallow=shallow, ellipsisroots=ellipsisroots,
                                   fullnodes=fullnodes)
             def getunbundler(version, fh, alg, extras=None):
                 """Return the unpacker registered for ``version``, built over ``fh``.

                 ``fh``, ``alg`` and ``extras`` are handed to the unpacker unchanged.
                 A ``KeyError`` is raised for a version missing from ``_packermap``.
                 """
                 makeunpacker = _packermap[version][1]
                 return makeunpacker(fh, alg, extras=extras)
             def _changegroupinfo(repo, nodes, source):
                 """Report through ``repo.ui`` which changesets are about to be sent.

                 The number of changesets is printed in verbose mode or when
                 ``source`` is ``'bundle'``; the hex form of every node is written to
                 the debug output when the debug flag is set.
                 """
                 ui = repo.ui
                 if ui.verbose or source == 'bundle':
                     ui.status(_("%d changesets found\n") % len(nodes))
                 if not ui.debugflag:
                     return
                 ui.debug("list of changesets:\n")
                 for n in nodes:
                     ui.debug("%s\n" % hex(n))
             def makechangegroup(repo, outgoing, version, source, fastpath=False,
                                 bundlecaps=None):
                 """Build a changegroup for ``outgoing`` and return an unbundler over it.

                 The stream produced by ``makestream`` is wrapped in a chunk buffer
                 and handed to the unbundler for ``version``; the number of missing
                 changesets is recorded in the extras under ``'clcount'``.
                 """
                 stream = makestream(repo, outgoing, version, source,
                                     fastpath=fastpath, bundlecaps=bundlecaps)
                 buffered = util.chunkbuffer(stream)
                 extras = {'clcount': len(outgoing.missing)}
                 return getunbundler(version, buffered, None, extras)
             def makestream(repo, outgoing, version, source, fastpath=False,
                            bundlecaps=None, filematcher=None):
                 """Return the changegroup chunk stream for the ``outgoing`` changesets.

                 ``outgoing`` supplies ``common``, ``missing`` and ``missingheads``;
                 ``version`` selects the packer through ``getbundler``. ``fastpath``
                 forces the linkrev fast path, which is also taken when the
                 unfiltered repo is being read and every head is requested.

                 The ``preoutgoing`` hook is fired with ``throw=True`` before the
                 stream is generated. ``outgoing`` is not modified.
                 """
                 bundler = getbundler(version, repo, bundlecaps=bundlecaps,
                                      filematcher=filematcher)

                 repo = repo.unfiltered()
                 commonrevs = outgoing.common
                 csets = outgoing.missing
                 # Sort a copy: sorting ``outgoing.missingheads`` in place would
                 # reorder an object that belongs to the caller.
                 heads = sorted(outgoing.missingheads)

                 # We go through the fast path if we get told to, or if all
                 # (unfiltered) heads have been requested (since we then know that
                 # all linkrevs will be pulled by the client).
                 fastpathlinkrev = fastpath or (
                         repo.filtername is None and heads == sorted(repo.heads()))

                 repo.hook('preoutgoing', throw=True, source=source)
                 _changegroupinfo(repo, csets, source)
                 return bundler.generate(commonrevs, csets, fastpathlinkrev, source)
             def _addchangegroupfiles(repo, source, revmap, trp, expectedfiles, needfiles):
                 """Apply the file revisions of a changegroup to the repo's file logs.

                 ``source`` yields one header per file (``filelogheader``) followed by
                 that file's deltas (``deltaiter``). ``needfiles`` maps a filename to
                 the nodes expected for it; entries are removed as the nodes arrive,
                 so the mapping is modified in place.

                 Returns a ``(revisions, files)`` pair: the number of revisions added
                 and the number of files seen.

                 Raises ``error.Abort`` when a file group is empty, a delta base is
                 censored, an unexpected node is received, or an expected node is
                 still unknown to its file log once everything has been applied.
                 """
                 revisions = 0
                 files = 0
                 progress = repo.ui.makeprogress(_('files'), unit=_('files'),
                                                 total=expectedfiles)
                 # An empty dict from filelogheader() marks the end of the file list.
                 for chunkdata in iter(source.filelogheader, {}):
                     files += 1
                     fname = chunkdata["filename"]
                     repo.ui.debug("adding %s revisions\n" % fname)
                     progress.increment()
                     flog = repo.file(fname)
                     oldlen = len(flog)
                     try:
                         added = flog.addgroup(source.deltaiter(), revmap, trp)
                         if not added:
                             raise error.Abort(_("received file revlog group is empty"))
                     except error.CensoredBaseError as e:
                         raise error.Abort(_("received delta base is censored: %s") % e)
                     newlen = len(flog)
                     revisions += newlen - oldlen
                     if fname not in needfiles:
                         continue
                     # Tick off every newly added node; anything not expected is
                     # an error.
                     needs = needfiles[fname]
                     for newrev in pycompat.xrange(oldlen, newlen):
                         newnode = flog.node(newrev)
                         if newnode not in needs:
                             raise error.Abort(
                                 _("received spurious file revlog entry"))
                         needs.remove(newnode)
                     if not needs:
                         del needfiles[fname]
                 progress.complete()

                 # Whatever is still listed must already be present in the file logs.
                 for fname, needs in needfiles.iteritems():
                     flog = repo.file(fname)
                     for missing in needs:
                         try:
                             flog.rev(missing)
                         except error.LookupError:
                             raise error.Abort(
                                 _('missing file data for %s:%s - run hg verify') %
                                 (fname, hex(missing)))
                 return revisions, files