upstream/mercurial-mirror Commit - r27219:beb60a89

1

# changegroup.py - Mercurial changegroup manipulation functions

1

# changegroup.py - Mercurial changegroup manipulation functions

2

#

2

#

3

4

#

4

#

5

# This software may be used and distributed according to the terms of the

5

# This software may be used and distributed according to the terms of the

6

# GNU General Public License version 2 or any later version.

6

# GNU General Public License version 2 or any later version.

7

8

from __future__ import absolute_import

8

from __future__ import absolute_import

9

10

import os

10

import os

11

import struct

11

import struct

12

import tempfile

12

import tempfile

13

import weakref

13

import weakref

14

15

from .i18n import _

15

from .i18n import _

16

from .node import (

16

from .node import (

17

hex,

17

hex,

18

nullid,

18

nullid,

19

nullrev,

19

nullrev,

20

short,

20

short,

21

)

21

)

22

23

from . import (

23

from . import (

24

branchmap,

24

branchmap,

25

dagutil,

25

dagutil,

26

discovery,

26

discovery,

27

error,

27

error,

28

mdiff,

28

mdiff,

29

phases,

29

phases,

30

util,

30

util,

31

)

31

)

32

33

# struct formats of the per-revision delta header in a changegroup stream.
# v1 carries four 20-byte fields (unpacked as node, p1, p2, cs); v2 carries
# five (node, p1, p2, deltabase, cs).
_CHANGEGROUPV1_DELTA_HEADER = "20s20s20s20s"
_CHANGEGROUPV2_DELTA_HEADER = "20s20s20s20s20s"

35

36

def readexactly(stream, n):
    '''read n bytes from stream.read and abort if less was available

    Returns the data read. Raises error.Abort when stream.read(n) yields
    fewer than n bytes.
    '''
    s = stream.read(n)
    if len(s) < n:
        raise error.Abort(_("stream ended unexpectedly"
                           " (got %d bytes, expected %d)")
                          % (len(s), n))
    return s

44

45

def getchunk(stream):
    """return the next chunk from stream as a string

    A chunk is a 4-byte big-endian signed length followed by the payload;
    the length counts its own 4 bytes. A length of 0 yields "" (the
    terminator written by closechunk()). Any other length <= 4 cannot
    describe a payload and raises error.Abort.
    """
    d = readexactly(stream, 4)
    l = struct.unpack(">l", d)[0]
    if l <= 4:
        if l:
            raise error.Abort(_("invalid chunk length %d") % l)
        return ""
    # the length prefix includes itself, so the payload is 4 bytes shorter
    return readexactly(stream, l - 4)

54

55

def chunkheader(length):
    """return a changegroup chunk header (string)

    length is the payload size; the packed big-endian value is length + 4
    because the header counts its own 4 bytes.
    """
    return struct.pack(">l", length + 4)

58

59

def closechunk():
    """return a changegroup chunk header (string) for a zero-length chunk"""
    # a packed length of 0 is what getchunk() treats as the empty chunk
    return struct.pack(">l", 0)

62

63

def combineresults(results):
    """logic to combine 0 or more addchangegroup results into one

    Each result follows the apply() return convention: 0 for nothing
    changed, 1 for head count unchanged, 1+n for n added heads, -1-n for
    n removed heads. The combined value uses the same convention over the
    net head change. With no results at all the answer is 1.
    """
    changedheads = 0
    for ret in results:
        # If any changegroup result is 0, return 0. Returning right away
        # keeps the 0 from being overwritten by head changes accumulated
        # from earlier results.
        if ret == 0:
            return 0
        if ret < -1:
            changedheads += ret + 1
        elif ret > 1:
            changedheads += ret - 1
    if changedheads > 0:
        return 1 + changedheads
    if changedheads < 0:
        return -1 + changedheads
    return 1

81

82

# Maps a bundle type name to a (file header, compression key) pair.
bundletypes = {
    "": ("", None),       # only when using unbundle on ssh and old http servers
                          # since the unification ssh accepts a header but there
                          # is no capability signaling it.
    "HG20": (),           # special-cased below
    "HG10UN": ("HG10UN", None),
    "HG10BZ": ("HG10", 'BZ'),
    "HG10GZ": ("HG10GZ", 'GZ'),
}

# hgweb uses this list to communicate its preferred type
bundlepriority = ['HG10GZ', 'HG10BZ', 'HG10UN']

94

95

def writechunks(ui, chunks, filename, vfs=None):
    """Write chunks to a file and return its filename.

    The stream is assumed to be a bundle file.
    If filename is given it is opened in "wb" mode, through vfs when one
    is supplied and with the builtin open() otherwise.
    If no filename is specified, a temporary file is created.
    If writing fails, the partially written file is removed and the
    exception propagates.

    ui is accepted for interface compatibility and is not used here.
    """
    fh = None
    cleanup = None
    # Remove a partial file through the same layer that created it: only a
    # file opened through vfs is unlinked through vfs.
    unlink = os.unlink
    try:
        if filename:
            if vfs:
                fh = vfs.open(filename, "wb")
                unlink = vfs.unlink
            else:
                fh = open(filename, "wb")
            # armed only after a successful open, so a failed open never
            # deletes a file that was already there
            cleanup = filename
        else:
            fd, filename = tempfile.mkstemp(prefix="hg-bundle-", suffix=".hg")
            # mkstemp already created the file; arm cleanup before fdopen
            cleanup = filename
            fh = os.fdopen(fd, "wb")
        for c in chunks:
            fh.write(c)
        # everything was written: keep the file
        cleanup = None
        return filename
    finally:
        if fh is not None:
            fh.close()
        if cleanup is not None:
            unlink(cleanup)

126

127

def writebundle(ui, cg, filename, bundletype, vfs=None, compression=None):
    """Write a bundle file and return its filename.

    cg is a changegroup object providing getchunks() and a version
    attribute. bundletype selects the container: "HG20" wraps the
    changegroup in a bundle2 'changegroup' part, any other value is looked
    up in bundletypes and only supports version '01' changegroups.
    compression is only meaningful for "HG20" and must be None otherwise.

    If no filename is specified, a temporary file is created.
    The actual writing is delegated to writechunks().

    Raises error.Abort for a non-v1 changegroup with an old bundle type or
    for a compression type missing from util.compressors.
    """

    if bundletype == "HG20":
        from . import bundle2
        bundle = bundle2.bundle20(ui)
        bundle.setcompression(compression)
        part = bundle.newpart('changegroup', data=cg.getchunks())
        part.addparam('version', cg.version)
        chunkiter = bundle.getchunks()
    else:
        # compression argument is only for the bundle2 case
        assert compression is None
        if cg.version != '01':
            raise error.Abort(_('old bundle types only supports v1 '
                                'changegroups'))
        header, comp = bundletypes[bundletype]
        if comp not in util.compressors:
            raise error.Abort(_('unknown stream compression type: %s')
                              % comp)
        z = util.compressors[comp]()
        subchunkiter = cg.getchunks()

        def compressedchunks():
            # the bundle header goes out uncompressed, then the payload
            yield header
            for chunk in subchunkiter:
                yield z.compress(chunk)
            yield z.flush()
        chunkiter = compressedchunks()

    # The chunks come from getchunks() rather than from raw reads of the
    # source. The original comment here says this parsing is needed,
    # otherwise we will block in case of sshrepo because we don't know the
    # end of the stream.
    return writechunks(ui, chunkiter, filename, vfs=vfs)

169

170

class cg1unpacker(object):
    """Unpacker for cg1 changegroup streams.

    A changegroup unpacker handles the framing of the revision data in
    the wire format. Most consumers will want to use the apply()
    method to add the changes from the changegroup to a repository.

    If you're forwarding a changegroup unmodified to another consumer,
    use getchunks(), which returns an iterator of changegroup
    chunks. This is mostly useful for cases where you need to know the
    data stream has ended by observing the end of the changegroup.

    deltachunk() is useful only if you're applying delta data. Most
    consumers should prefer apply() instead.

    A few other public methods exist. Those are used only for
    bundlerepo and some debug commands - their use is discouraged.
    """
    deltaheader = _CHANGEGROUPV1_DELTA_HEADER
    deltaheadersize = struct.calcsize(deltaheader)
    version = '01'

    def __init__(self, fh, alg):
        """Wrap fh in the decompressor registered for alg.

        alg 'UN' is treated as None; 'BZ' selects the '_truncatedBZ'
        decompressor. Raises error.Abort if alg is not a key of
        util.decompressors.
        """
        if alg == 'UN':
            alg = None # get more modern without breaking too much
        if alg not in util.decompressors:
            raise error.Abort(_('unknown stream compression type: %s')
                              % alg)
        if alg == 'BZ':
            alg = '_truncatedBZ'
        self._stream = util.decompressors[alg](fh)
        self._type = alg
        # optional callable invoked once per non-empty chunk length read
        self.callback = None

    # These methods (compressed, read, seek, tell) all appear to only
    # be used by bundlerepo, but it's a little hard to tell.
    def compressed(self):
        return self._type is not None

    def read(self, l):
        return self._stream.read(l)

    def seek(self, pos):
        return self._stream.seek(pos)

    def tell(self):
        return self._stream.tell()

    def close(self):
        return self._stream.close()

    def _chunklength(self):
        """Read a chunk length prefix and return the payload size.

        Returns 0 for the empty (terminating) chunk. Raises error.Abort
        for any other length <= 4. Fires self.callback, when set, for
        every non-empty chunk.
        """
        d = readexactly(self._stream, 4)
        l = struct.unpack(">l", d)[0]
        if l <= 4:
            if l:
                raise error.Abort(_("invalid chunk length %d") % l)
            return 0
        if self.callback:
            self.callback()
        return l - 4

    def changelogheader(self):
        """v10 does not have a changelog header chunk"""
        return {}

    def manifestheader(self):
        """v10 does not have a manifest header chunk"""
        return {}

    def filelogheader(self):
        """return the header of the filelogs chunk, v10 only has the filename"""
        l = self._chunklength()
        if not l:
            return {}
        fname = readexactly(self._stream, l)
        return {'filename': fname}

    def _deltaheader(self, headertuple, prevnode):
        """Expand an unpacked v1 delta header into the 5-field form.

        v1 has no explicit delta base: it is p1 for the first chunk
        (prevnode is None) and the previous node otherwise.
        """
        node, p1, p2, cs = headertuple
        if prevnode is None:
            deltabase = p1
        else:
            deltabase = prevnode
        return node, p1, p2, deltabase, cs

    def deltachunk(self, prevnode):
        """Read the next delta chunk and return it as a dict.

        Returns {} at the end of the current chunk group. Otherwise the
        dict has the keys 'node', 'p1', 'p2', 'cs', 'deltabase' and
        'delta'.
        """
        l = self._chunklength()
        if not l:
            return {}
        headerdata = readexactly(self._stream, self.deltaheadersize)
        header = struct.unpack(self.deltaheader, headerdata)
        delta = readexactly(self._stream, l - self.deltaheadersize)
        node, p1, p2, deltabase, cs = self._deltaheader(header, prevnode)
        return {'node': node, 'p1': p1, 'p2': p2, 'cs': cs,
                'deltabase': deltabase, 'delta': delta}

    def getchunks(self):
        """returns all the chunks contains in the bundle

        Used when you need to forward the binary stream to a file or another
        network API. To do so, it parse the changegroup data, otherwise it will
        block in case of sshrepo because it don't know the end of the stream.
        """
        # an empty chunkgroup is the end of the changegroup
        # a changegroup has at least 2 chunkgroups (changelog and manifest).
        # after that, an empty chunkgroup is the end of the changegroup
        empty = False
        count = 0
        while not empty or count <= 2:
            empty = True
            count += 1
            while True:
                chunk = getchunk(self)
                if not chunk:
                    break
                empty = False
                yield chunkheader(len(chunk))
                # re-emit the payload in slices of at most 2**20 bytes
                pos = 0
                while pos < len(chunk):
                    end = pos + 2**20
                    yield chunk[pos:end]
                    pos = end
            yield closechunk()

    def _unpackmanifests(self, repo, revmap, trp, prog, numchanges):
        # We know that we'll never have more manifests than we had
        # changesets.
        self.callback = prog(_('manifests'), numchanges)
        # no need to check for empty manifest group here:
        # if the result of the merge of 1 and 2 is the same in 3 and 4,
        # no new manifest will be created and the manifest group will
        # be empty during the pull
        self.manifestheader()
        repo.manifest.addgroup(self, revmap, trp)
        repo.ui.progress(_('manifests'), None)

    def apply(self, repo, srctype, url, emptyok=False,
              targetphase=phases.draft, expectedtotal=None):
        """Add the changegroup returned by source.read() to this repo.
        srctype is a string like 'push', 'pull', or 'unbundle'.  url is
        the URL of the repo where this changegroup is coming from.

        Return an integer summarizing the change to this repo:
        - nothing changed or no source: 0
        - more heads than before: 1+added heads (2..n)
        - fewer heads than before: -1-removed heads (-2..-n)
        - number of heads stays the same: 1
        """
        repo = repo.unfiltered()
        wasempty = (len(repo.changelog) == 0)
        def csmap(x):
            repo.ui.debug("add changeset %s\n" % short(x))
            return len(cl)

        def revmap(x):
            return cl.rev(x)

        changesets = files = revisions = 0

        tr = repo.transaction("\n".join([srctype, util.hidepassword(url)]))
        try:
            # The transaction could have been created before and already
            # carries source information. In this case we use the top
            # level data. We overwrite the argument because we need to use
            # the top level value (if they exist) in this function.
            srctype = tr.hookargs.setdefault('source', srctype)
            url = tr.hookargs.setdefault('url', url)
            repo.hook('prechangegroup', throw=True, **tr.hookargs)

            # write changelog data to temp files so concurrent readers
            # will not see an inconsistent view
            cl = repo.changelog
            cl.delayupdate(tr)
            oldheads = cl.heads()

            trp = weakref.proxy(tr)
            # pull off the changeset group
            repo.ui.status(_("adding changesets\n"))
            clstart = len(cl)
            class prog(object):
                def __init__(self, step, total):
                    self._step = step
                    self._total = total
                    self._count = 1
                def __call__(self):
                    repo.ui.progress(self._step, self._count, unit=_('chunks'),
                                     total=self._total)
                    self._count += 1
            self.callback = prog(_('changesets'), expectedtotal)

            efiles = set()
            def onchangelog(cl, node):
                efiles.update(cl.read(node)[3])

            self.changelogheader()
            srccontent = cl.addgroup(self, csmap, trp,
                                     addrevisioncb=onchangelog)
            efiles = len(efiles)

            if not (srccontent or emptyok):
                raise error.Abort(_("received changelog group is empty"))
            clend = len(cl)
            changesets = clend - clstart
            repo.ui.progress(_('changesets'), None)

            # pull off the manifest group
            repo.ui.status(_("adding manifests\n"))
            self._unpackmanifests(repo, revmap, trp, prog, changesets)

            needfiles = {}
            if repo.ui.configbool('server', 'validate', default=False):
                # validate incoming csets have their manifests
                for cset in xrange(clstart, clend):
                    mfnode = repo.changelog.read(repo.changelog.node(cset))[0]
                    mfest = repo.manifest.readdelta(mfnode)
                    # store file nodes we must see
                    for f, n in mfest.iteritems():
                        needfiles.setdefault(f, set()).add(n)

            # process the files
            repo.ui.status(_("adding file changes\n"))
            self.callback = None
            pr = prog(_('files'), efiles)
            newrevs, newfiles = _addchangegroupfiles(
                repo, self, revmap, trp, pr, needfiles, wasempty)
            revisions += newrevs
            files += newfiles

            dh = 0
            if oldheads:
                heads = cl.heads()
                dh = len(heads) - len(oldheads)
                for h in heads:
                    if h not in oldheads and repo[h].closesbranch():
                        dh -= 1
            htext = ""
            if dh:
                htext = _(" (%+d heads)") % dh

            repo.ui.status(_("added %d changesets"
                             " with %d changes to %d files%s\n")
                             % (changesets, revisions, files, htext))
            repo.invalidatevolatilesets()

            if changesets > 0:
                if 'node' not in tr.hookargs:
                    tr.hookargs['node'] = hex(cl.node(clstart))
                    hookargs = dict(tr.hookargs)
                else:
                    hookargs = dict(tr.hookargs)
                    hookargs['node'] = hex(cl.node(clstart))
                repo.hook('pretxnchangegroup', throw=True, **hookargs)

            added = [cl.node(r) for r in xrange(clstart, clend)]
            publishing = repo.publishing()
            if srctype in ('push', 'serve'):
                # Old servers can not push the boundary themselves.
                # New servers won't push the boundary if changeset already
                # exists locally as secret
                #
                # We should not use added here but the list of all change in
                # the bundle
                if publishing:
                    phases.advanceboundary(repo, tr, phases.public, srccontent)
                else:
                    # Those changesets have been pushed from the outside, their
                    # phases are going to be pushed alongside. Therefor
                    # `targetphase` is ignored.
                    phases.advanceboundary(repo, tr, phases.draft, srccontent)
                    phases.retractboundary(repo, tr, phases.draft, added)
            elif srctype != 'strip':
                # publishing only alter behavior during push
                #
                # strip should not touch boundary at all
                phases.retractboundary(repo, tr, targetphase, added)

            if changesets > 0:
                if srctype != 'strip':
                    # During strip, branchcache is invalid but coming call to
                    # `destroyed` will repair it.
                    # In other case we can safely update cache on disk.
                    branchmap.updatecache(repo.filtered('served'))

                def runhooks():
                    # These hooks run when the lock releases, not when the
                    # transaction closes. So it's possible for the changelog
                    # to have changed since we last saw it.
                    if clstart >= len(repo):
                        return

                    # forcefully update the on-disk branch cache
                    repo.ui.debug("updating the branch cache\n")
                    repo.hook("changegroup", **hookargs)

                    for n in added:
                        args = hookargs.copy()
                        args['node'] = hex(n)
                        repo.hook("incoming", **args)

                    newheads = [h for h in repo.heads() if h not in oldheads]
                    repo.ui.log("incoming",
                                "%s incoming changes - new heads: %s\n",
                                len(added),
                                ', '.join([hex(c[:6]) for c in newheads]))

                tr.addpostclose('changegroup-runhooks-%020i' % clstart,
                                lambda tr: repo._afterlock(runhooks))

            tr.close()

        finally:
            tr.release()
            repo.ui.flush()
        # never return 0 here:
        if dh < 0:
            return dh - 1
        else:
            return dh + 1

484

485

class cg2unpacker(cg1unpacker):
    """Unpacker for cg2 streams.

    cg2 streams add support for generaldelta, so the delta header
    format is slightly different. All other features about the data
    remain the same.
    """
    deltaheader = _CHANGEGROUPV2_DELTA_HEADER
    deltaheadersize = struct.calcsize(deltaheader)
    version = '02'

    def _deltaheader(self, headertuple, prevnode):
        # the v2 header already carries the delta base, so prevnode is unused
        node, p1, p2, deltabase, cs = headertuple
        return node, p1, p2, deltabase, cs

499

500

class headerlessfixup(object):

500

class headerlessfixup(object):

501

def __init__(self, fh, h):

501

def __init__(self, fh, h):

502

self._h = h

502

self._h = h

503

self._fh = fh

503

self._fh = fh

504

def read(self, n):

504

def read(self, n):

505

if self._h:

505

if self._h:

506

d, self._h = self._h[:n], self._h[n:]

506

d, self._h = self._h[:n], self._h[n:]

507

if len(d) < n:

507

if len(d) < n:

508

d += readexactly(self._fh, n - len(d))

508

d += readexactly(self._fh, n - len(d))

509

return d

509

return d

510

return readexactly(self._fh, n)

510

return readexactly(self._fh, n)

511

512

class cg1packer(object):

512

class cg1packer(object):

513

deltaheader = _CHANGEGROUPV1_DELTA_HEADER

513

deltaheader = _CHANGEGROUPV1_DELTA_HEADER

514

version = '01'

514

version = '01'

515

def __init__(self, repo, bundlecaps=None):

515

def __init__(self, repo, bundlecaps=None):

516

"""Given a source repo, construct a bundler.

516

"""Given a source repo, construct a bundler.

517

518

bundlecaps is optional and can be used to specify the set of

518

bundlecaps is optional and can be used to specify the set of

519

capabilities which can be used to build the bundle.

519

capabilities which can be used to build the bundle.

520

"""

520

"""

521

# Set of capabilities we can use to build the bundle.

521

# Set of capabilities we can use to build the bundle.

522

if bundlecaps is None:

522

if bundlecaps is None:

523

bundlecaps = set()

523

bundlecaps = set()

524

self._bundlecaps = bundlecaps

524

self._bundlecaps = bundlecaps

525

# experimental config: bundle.reorder

525

# experimental config: bundle.reorder

526

reorder = repo.ui.config('bundle', 'reorder', 'auto')

526

reorder = repo.ui.config('bundle', 'reorder', 'auto')

527

if reorder == 'auto':

527

if reorder == 'auto':

528

reorder = None

528

reorder = None

529

else:

529

else:

530

reorder = util.parsebool(reorder)

530

reorder = util.parsebool(reorder)

531

self._repo = repo

531

self._repo = repo

532

self._reorder = reorder

532

self._reorder = reorder

533

self._progress = repo.ui.progress

533

self._progress = repo.ui.progress

534

if self._repo.ui.verbose and not self._repo.ui.debugflag:

534

if self._repo.ui.verbose and not self._repo.ui.debugflag:

535

self._verbosenote = self._repo.ui.note

535

self._verbosenote = self._repo.ui.note

536

else:

536

else:

537

self._verbosenote = lambda s: None

537

self._verbosenote = lambda s: None

538

539

def close(self):

539

def close(self):

540

return closechunk()

540

return closechunk()

541

542

def fileheader(self, fname):

542

def fileheader(self, fname):

543

return chunkheader(len(fname)) + fname

543

return chunkheader(len(fname)) + fname

544

545

def group(self, nodelist, revlog, lookup, units=None):

545

def group(self, nodelist, revlog, lookup, units=None):

546

"""Calculate a delta group, yielding a sequence of changegroup chunks

546

"""Calculate a delta group, yielding a sequence of changegroup chunks

547

(strings).

547

(strings).

548

549

Given a list of changeset revs, return a set of deltas and

549

Given a list of changeset revs, return a set of deltas and

550

metadata corresponding to nodes. The first delta is

550

metadata corresponding to nodes. The first delta is

551

first parent(nodelist[0]) -> nodelist[0], the receiver is

551

first parent(nodelist[0]) -> nodelist[0], the receiver is

552

guaranteed to have this parent as it has all history before

552

guaranteed to have this parent as it has all history before

553

these changesets. In the case firstparent is nullrev the

553

these changesets. In the case firstparent is nullrev the

554

changegroup starts with a full revision.

554

changegroup starts with a full revision.

555

556

If units is not None, progress detail will be generated, units specifies

556

If units is not None, progress detail will be generated, units specifies

557

the type of revlog that is touched (changelog, manifest, etc.).

557

the type of revlog that is touched (changelog, manifest, etc.).

558

"""

558

"""

559

# if we don't have any revisions touched by these changesets, bail

559

# if we don't have any revisions touched by these changesets, bail

560

if len(nodelist) == 0:

560

if len(nodelist) == 0:

561

yield self.close()

561

yield self.close()

562

return

562

return

563

564

# for generaldelta revlogs, we linearize the revs; this will both be

564

# for generaldelta revlogs, we linearize the revs; this will both be

565

# much quicker and generate a much smaller bundle

565

# much quicker and generate a much smaller bundle

566

if (revlog._generaldelta and self._reorder is None) or self._reorder:

566

if (revlog._generaldelta and self._reorder is None) or self._reorder:

567

dag = dagutil.revlogdag(revlog)

567

dag = dagutil.revlogdag(revlog)

568

revs = set(revlog.rev(n) for n in nodelist)

568

revs = set(revlog.rev(n) for n in nodelist)

569

revs = dag.linearize(revs)

569

revs = dag.linearize(revs)

570

else:

570

else:

571

revs = sorted([revlog.rev(n) for n in nodelist])

571

revs = sorted([revlog.rev(n) for n in nodelist])

572

573

# add the parent of the first rev

573

# add the parent of the first rev

574

p = revlog.parentrevs(revs[0])[0]

574

p = revlog.parentrevs(revs[0])[0]

575

revs.insert(0, p)

575

revs.insert(0, p)

576

577

# build deltas

577

# build deltas

578

total = len(revs) - 1

578

total = len(revs) - 1

579

msgbundling = _('bundling')

579

msgbundling = _('bundling')

580

for r in xrange(len(revs) - 1):

580

for r in xrange(len(revs) - 1):

581

if units is not None:

581

if units is not None:

582

self._progress(msgbundling, r + 1, unit=units, total=total)

582

self._progress(msgbundling, r + 1, unit=units, total=total)

583

prev, curr = revs[r], revs[r + 1]

583

prev, curr = revs[r], revs[r + 1]

584

linknode = lookup(revlog.node(curr))

584

linknode = lookup(revlog.node(curr))

585

for c in self.revchunk(revlog, curr, prev, linknode):

585

for c in self.revchunk(revlog, curr, prev, linknode):

586

yield c

586

yield c

587

588

if units is not None:

588

if units is not None:

589

self._progress(msgbundling, None)

589

self._progress(msgbundling, None)

590

yield self.close()

590

yield self.close()

591

592

# filter any nodes that claim to be part of the known set

592

# filter any nodes that claim to be part of the known set

593

def prune(self, revlog, missing, commonrevs):

593

def prune(self, revlog, missing, commonrevs):

594

rr, rl = revlog.rev, revlog.linkrev

594

rr, rl = revlog.rev, revlog.linkrev

595

return [n for n in missing if rl(rr(n)) not in commonrevs]

595

return [n for n in missing if rl(rr(n)) not in commonrevs]

596

597

def _packmanifests(self, mfnodes, lookuplinknode):

597

def _packmanifests(self, mfnodes, lookuplinknode):

598

"""Pack flat manifests into a changegroup stream."""

598

"""Pack flat manifests into a changegroup stream."""

599

ml = self._repo.manifest

599

ml = self._repo.manifest

600

size = 0

600

size = 0

601

for chunk in self.group(

601

for chunk in self.group(

602

mfnodes, ml, lookuplinknode, units=_('manifests')):

602

mfnodes, ml, lookuplinknode, units=_('manifests')):

603

size += len(chunk)

603

size += len(chunk)

604

yield chunk

604

yield chunk

605

self._verbosenote(_('%8.i (manifests)\n') % size)

605

self._verbosenote(_('%8.i (manifests)\n') % size)

606

607

def generate(self, commonrevs, clnodes, fastpathlinkrev, source):

607

def generate(self, commonrevs, clnodes, fastpathlinkrev, source):

608

'''yield a sequence of changegroup chunks (strings)'''

608

'''yield a sequence of changegroup chunks (strings)'''

609

repo = self._repo

609

repo = self._repo

610

cl = repo.changelog

610

cl = repo.changelog

611

ml = repo.manifest

611

ml = repo.manifest

612

613

clrevorder = {}

613

clrevorder = {}

614

mfs = {} # needed manifests

614

mfs = {} # needed manifests

615

fnodes = {} # needed file nodes

615

fnodes = {} # needed file nodes

616

changedfiles = set()

616

changedfiles = set()

617

618

# Callback for the changelog, used to collect changed files and manifest

618

# Callback for the changelog, used to collect changed files and manifest

619

# nodes.

619

# nodes.

620

# Returns the linkrev node (identity in the changelog case).

620

# Returns the linkrev node (identity in the changelog case).

621

def lookupcl(x):

621

def lookupcl(x):

622

c = cl.read(x)

622

c = cl.read(x)

623

clrevorder[x] = len(clrevorder)

623

clrevorder[x] = len(clrevorder)

624

changedfiles.update(c[3])

624

changedfiles.update(c[3])

625

# record the first changeset introducing this manifest version

625

# record the first changeset introducing this manifest version

626

mfs.setdefault(c[0], x)

626

mfs.setdefault(c[0], x)

627

return x

627

return x

628

629

self._verbosenote(_('uncompressed size of bundle content:\n'))

629

self._verbosenote(_('uncompressed size of bundle content:\n'))

630

size = 0

630

size = 0

631

for chunk in self.group(clnodes, cl, lookupcl, units=_('changesets')):

631

for chunk in self.group(clnodes, cl, lookupcl, units=_('changesets')):

632

size += len(chunk)

632

size += len(chunk)

633

yield chunk

633

yield chunk

634

self._verbosenote(_('%8.i (changelog)\n') % size)

634

self._verbosenote(_('%8.i (changelog)\n') % size)

635

636

# We need to make sure that the linkrev in the changegroup refers to

636

# We need to make sure that the linkrev in the changegroup refers to

637

# the first changeset that introduced the manifest or file revision.

637

# the first changeset that introduced the manifest or file revision.

638

# The fastpath is usually safer than the slowpath, because the filelogs

638

# The fastpath is usually safer than the slowpath, because the filelogs

639

# are walked in revlog order.

639

# are walked in revlog order.

640

#

640

#

641

# When taking the slowpath with reorder=None and the manifest revlog

641

# When taking the slowpath with reorder=None and the manifest revlog

642

# uses generaldelta, the manifest may be walked in the "wrong" order.

642

# uses generaldelta, the manifest may be walked in the "wrong" order.

643

# Without 'clrevorder', we would get an incorrect linkrev (see fix in

643

# Without 'clrevorder', we would get an incorrect linkrev (see fix in

644

# cc0ff93d0c0c).

644

# cc0ff93d0c0c).

645

#

645

#

646

# When taking the fastpath, we are only vulnerable to reordering

646

# When taking the fastpath, we are only vulnerable to reordering

647

# of the changelog itself. The changelog never uses generaldelta, so

647

# of the changelog itself. The changelog never uses generaldelta, so

648

# it is only reordered when reorder=True. To handle this case, we

648

# it is only reordered when reorder=True. To handle this case, we

649

# simply take the slowpath, which already has the 'clrevorder' logic.

649

# simply take the slowpath, which already has the 'clrevorder' logic.

650

# This was also fixed in cc0ff93d0c0c.

650

# This was also fixed in cc0ff93d0c0c.

651

fastpathlinkrev = fastpathlinkrev and not self._reorder

651

fastpathlinkrev = fastpathlinkrev and not self._reorder

652

# Callback for the manifest, used to collect linkrevs for filelog

652

# Callback for the manifest, used to collect linkrevs for filelog

653

# revisions.

653

# revisions.

654

# Returns the linkrev node (collected in lookupcl).

654

# Returns the linkrev node (collected in lookupcl).

655

def lookupmflinknode(x):

655

def lookupmflinknode(x):

656

"""Callback for looking up the linknode for manifests.

657

658

Returns the linkrev node for the specified manifest.

659

660

SIDE EFFECT:

661

662

fclnodes gets populated with the list of relevant

663

file nodes if we're not using fastpathlinkrev.

664

665

Note that this means you can't trust fclnodes until

666

after manifests have been sent to the client.

667

"""

656

clnode = mfs[x]

668

clnode = mfs[x]

657

if not fastpathlinkrev:

669

if not fastpathlinkrev:

658

mdata = ml.readfast(x)

670

mdata = ml.readfast(x)

659

for f, n in mdata.iteritems():

671

for f, n in mdata.iteritems():

660

if f in changedfiles:

672

if f in changedfiles:

661

# record the first changeset introducing this filelog

673

# record the first changeset introducing this filelog

662

# version

674

# version

663

fclnodes = fnodes.setdefault(f, {})

675

fclnodes = fnodes.setdefault(f, {})

664

fclnode = fclnodes.setdefault(n, clnode)

676

fclnode = fclnodes.setdefault(n, clnode)

665

if clrevorder[clnode] < clrevorder[fclnode]:

677

if clrevorder[clnode] < clrevorder[fclnode]:

666

fclnodes[n] = clnode

678

fclnodes[n] = clnode

667

return clnode

679

return clnode

668

680

669

mfnodes = self.prune(ml, mfs, commonrevs)

681

mfnodes = self.prune(ml, mfs, commonrevs)

670

for x in self._packmanifests(mfnodes, lookupmflinknode):

682

for x in self._packmanifests(mfnodes, lookupmflinknode):

671

yield x

683

yield x

672

684

673

mfs.clear()

685

mfs.clear()

674

clrevs = set(cl.rev(x) for x in clnodes)

686

clrevs = set(cl.rev(x) for x in clnodes)

675

687

676

def linknodes(filerevlog, fname):

688

def linknodes(filerevlog, fname):

677

if fastpathlinkrev:

689

if fastpathlinkrev:

678

llr = filerevlog.linkrev

690

llr = filerevlog.linkrev

679

def genfilenodes():

691

def genfilenodes():

680

for r in filerevlog:

692

for r in filerevlog:

681

linkrev = llr(r)

693

linkrev = llr(r)

682

if linkrev in clrevs:

694

if linkrev in clrevs:

683

yield filerevlog.node(r), cl.node(linkrev)

695

yield filerevlog.node(r), cl.node(linkrev)

684

return dict(genfilenodes())

696

return dict(genfilenodes())

685

return fnodes.get(fname, {})

697

return fnodes.get(fname, {})

686

698

687

for chunk in self.generatefiles(changedfiles, linknodes, commonrevs,

699

for chunk in self.generatefiles(changedfiles, linknodes, commonrevs,

688

source):

700

source):

689

yield chunk

701

yield chunk

690

702

691

yield self.close()

703

yield self.close()

692

704

693

if clnodes:

705

if clnodes:

694

repo.hook('outgoing', node=hex(clnodes[0]), source=source)

706

repo.hook('outgoing', node=hex(clnodes[0]), source=source)

695

707

696

# The 'source' parameter is useful for extensions

708

# The 'source' parameter is useful for extensions

697

def generatefiles(self, changedfiles, linknodes, commonrevs, source):

709

def generatefiles(self, changedfiles, linknodes, commonrevs, source):

698

repo = self._repo

710

repo = self._repo

699

progress = self._progress

711

progress = self._progress

700

msgbundling = _('bundling')

712

msgbundling = _('bundling')

701

713

702

total = len(changedfiles)

714

total = len(changedfiles)

703

# for progress output

715

# for progress output

704

msgfiles = _('files')

716

msgfiles = _('files')

705

for i, fname in enumerate(sorted(changedfiles)):

717

for i, fname in enumerate(sorted(changedfiles)):

706

filerevlog = repo.file(fname)

718

filerevlog = repo.file(fname)

707

if not filerevlog:

719

if not filerevlog:

708

raise error.Abort(_("empty or missing revlog for %s") % fname)

720

raise error.Abort(_("empty or missing revlog for %s") % fname)

709

721

710

linkrevnodes = linknodes(filerevlog, fname)

722

linkrevnodes = linknodes(filerevlog, fname)

711

# Lookup for filenodes, we collected the linkrev nodes above in the

723

# Lookup for filenodes, we collected the linkrev nodes above in the

712

# fastpath case and with lookupmf in the slowpath case.

724

# fastpath case and with lookupmf in the slowpath case.

713

def lookupfilelog(x):

725

def lookupfilelog(x):

714

return linkrevnodes[x]

726

return linkrevnodes[x]

715

727

716

filenodes = self.prune(filerevlog, linkrevnodes, commonrevs)

728

filenodes = self.prune(filerevlog, linkrevnodes, commonrevs)

717

if filenodes:

729

if filenodes:

718

progress(msgbundling, i + 1, item=fname, unit=msgfiles,

730

progress(msgbundling, i + 1, item=fname, unit=msgfiles,

719

total=total)

731

total=total)

720

h = self.fileheader(fname)

732

h = self.fileheader(fname)

721

size = len(h)

733

size = len(h)

722

yield h

734

yield h

723

for chunk in self.group(filenodes, filerevlog, lookupfilelog):

735

for chunk in self.group(filenodes, filerevlog, lookupfilelog):

724

size += len(chunk)

736

size += len(chunk)

725

yield chunk

737

yield chunk

726

self._verbosenote(_('%8.i %s\n') % (size, fname))

738

self._verbosenote(_('%8.i %s\n') % (size, fname))

727

progress(msgbundling, None)

739

progress(msgbundling, None)

728

740

729

def deltaparent(self, revlog, rev, p1, p2, prev):

741

def deltaparent(self, revlog, rev, p1, p2, prev):

730

return prev

742

return prev

731

743

732

def revchunk(self, revlog, rev, prev, linknode):

744

def revchunk(self, revlog, rev, prev, linknode):

733

node = revlog.node(rev)

745

node = revlog.node(rev)

734

p1, p2 = revlog.parentrevs(rev)

746

p1, p2 = revlog.parentrevs(rev)

735

base = self.deltaparent(revlog, rev, p1, p2, prev)

747

base = self.deltaparent(revlog, rev, p1, p2, prev)

736

748

737

prefix = ''

749

prefix = ''

738

if revlog.iscensored(base) or revlog.iscensored(rev):

750

if revlog.iscensored(base) or revlog.iscensored(rev):

739

try:

751

try:

740

delta = revlog.revision(node)

752

delta = revlog.revision(node)

741

except error.CensoredNodeError as e:

753

except error.CensoredNodeError as e:

742

delta = e.tombstone

754

delta = e.tombstone

743

if base == nullrev:

755

if base == nullrev:

744

prefix = mdiff.trivialdiffheader(len(delta))

756

prefix = mdiff.trivialdiffheader(len(delta))

745

else:

757

else:

746

baselen = revlog.rawsize(base)

758

baselen = revlog.rawsize(base)

747

prefix = mdiff.replacediffheader(baselen, len(delta))

759

prefix = mdiff.replacediffheader(baselen, len(delta))

748

elif base == nullrev:

760

elif base == nullrev:

749

delta = revlog.revision(node)

761

delta = revlog.revision(node)

750

prefix = mdiff.trivialdiffheader(len(delta))

762

prefix = mdiff.trivialdiffheader(len(delta))

751

else:

763

else:

752

delta = revlog.revdiff(base, rev)

764

delta = revlog.revdiff(base, rev)

753

p1n, p2n = revlog.parents(node)

765

p1n, p2n = revlog.parents(node)

754

basenode = revlog.node(base)

766

basenode = revlog.node(base)

755

meta = self.builddeltaheader(node, p1n, p2n, basenode, linknode)

767

meta = self.builddeltaheader(node, p1n, p2n, basenode, linknode)

756

meta += prefix

768

meta += prefix

757

l = len(meta) + len(delta)

769

l = len(meta) + len(delta)

758

yield chunkheader(l)

770

yield chunkheader(l)

759

yield meta

771

yield meta

760

yield delta

772

yield delta

761

def builddeltaheader(self, node, p1n, p2n, basenode, linknode):

773

def builddeltaheader(self, node, p1n, p2n, basenode, linknode):

762

# do nothing with basenode, it is implicitly the previous one in HG10

774

# do nothing with basenode, it is implicitly the previous one in HG10

763

return struct.pack(self.deltaheader, node, p1n, p2n, linknode)

775

return struct.pack(self.deltaheader, node, p1n, p2n, linknode)

764

776

765

class cg2packer(cg1packer):

777

class cg2packer(cg1packer):

766

version = '02'

778

version = '02'

767

deltaheader = _CHANGEGROUPV2_DELTA_HEADER

779

deltaheader = _CHANGEGROUPV2_DELTA_HEADER

768

780

769

def __init__(self, repo, bundlecaps=None):

781

def __init__(self, repo, bundlecaps=None):

770

super(cg2packer, self).__init__(repo, bundlecaps)

782

super(cg2packer, self).__init__(repo, bundlecaps)

771

if self._reorder is None:

783

if self._reorder is None:

772

# Since generaldelta is directly supported by cg2, reordering

784

# Since generaldelta is directly supported by cg2, reordering

773

# generally doesn't help, so we disable it by default (treating

785

# generally doesn't help, so we disable it by default (treating

774

# bundle.reorder=auto just like bundle.reorder=False).

786

# bundle.reorder=auto just like bundle.reorder=False).

775

self._reorder = False

787

self._reorder = False

776

788

777

def deltaparent(self, revlog, rev, p1, p2, prev):

789

def deltaparent(self, revlog, rev, p1, p2, prev):

778

dp = revlog.deltaparent(rev)

790

dp = revlog.deltaparent(rev)

779

# avoid storing full revisions; pick prev in those cases

791

# avoid storing full revisions; pick prev in those cases

780

# also pick prev when we can't be sure remote has dp

792

# also pick prev when we can't be sure remote has dp

781

if dp == nullrev or (dp != p1 and dp != p2 and dp != prev):

793

if dp == nullrev or (dp != p1 and dp != p2 and dp != prev):

782

return prev

794

return prev

783

return dp

795

return dp

784

796

785

def builddeltaheader(self, node, p1n, p2n, basenode, linknode):

797

def builddeltaheader(self, node, p1n, p2n, basenode, linknode):

786

return struct.pack(self.deltaheader, node, p1n, p2n, basenode, linknode)

798

return struct.pack(self.deltaheader, node, p1n, p2n, basenode, linknode)

787

799

788

packermap = {'01': (cg1packer, cg1unpacker),

800

packermap = {'01': (cg1packer, cg1unpacker),

789

# cg2 adds support for exchanging generaldelta

801

# cg2 adds support for exchanging generaldelta

790

'02': (cg2packer, cg2unpacker),

802

'02': (cg2packer, cg2unpacker),

791

}

803

}

792

804

793

def _changegroupinfo(repo, nodes, source):

805

def _changegroupinfo(repo, nodes, source):

794

if repo.ui.verbose or source == 'bundle':

806

if repo.ui.verbose or source == 'bundle':

795

repo.ui.status(_("%d changesets found\n") % len(nodes))

807

repo.ui.status(_("%d changesets found\n") % len(nodes))

796

if repo.ui.debugflag:

808

if repo.ui.debugflag:

797

repo.ui.debug("list of changesets:\n")

809

repo.ui.debug("list of changesets:\n")

798

for node in nodes:

810

for node in nodes:

799

repo.ui.debug("%s\n" % hex(node))

811

repo.ui.debug("%s\n" % hex(node))

800

812

801

def getsubsetraw(repo, outgoing, bundler, source, fastpath=False):

813

def getsubsetraw(repo, outgoing, bundler, source, fastpath=False):

802

repo = repo.unfiltered()

814

repo = repo.unfiltered()

803

commonrevs = outgoing.common

815

commonrevs = outgoing.common

804

csets = outgoing.missing

816

csets = outgoing.missing

805

heads = outgoing.missingheads

817

heads = outgoing.missingheads

806

# We go through the fast path if we get told to, or if all (unfiltered

818

# We go through the fast path if we get told to, or if all (unfiltered

807

# heads have been requested (since we then know there all linkrevs will

819

# heads have been requested (since we then know there all linkrevs will

808

# be pulled by the client).

820

# be pulled by the client).

809

heads.sort()

821

heads.sort()

810

fastpathlinkrev = fastpath or (

822

fastpathlinkrev = fastpath or (

811

repo.filtername is None and heads == sorted(repo.heads()))

823

repo.filtername is None and heads == sorted(repo.heads()))

812

824

813

repo.hook('preoutgoing', throw=True, source=source)

825

repo.hook('preoutgoing', throw=True, source=source)

814

_changegroupinfo(repo, csets, source)

826

_changegroupinfo(repo, csets, source)

815

return bundler.generate(commonrevs, csets, fastpathlinkrev, source)

827

return bundler.generate(commonrevs, csets, fastpathlinkrev, source)

816

828

817

def getsubset(repo, outgoing, bundler, source, fastpath=False):

829

def getsubset(repo, outgoing, bundler, source, fastpath=False):

818

gengroup = getsubsetraw(repo, outgoing, bundler, source, fastpath)

830

gengroup = getsubsetraw(repo, outgoing, bundler, source, fastpath)

819

return packermap[bundler.version][1](util.chunkbuffer(gengroup), None)

831

return packermap[bundler.version][1](util.chunkbuffer(gengroup), None)

820

832

821

def changegroupsubset(repo, roots, heads, source, version='01'):

833

def changegroupsubset(repo, roots, heads, source, version='01'):

822

"""Compute a changegroup consisting of all the nodes that are

834

"""Compute a changegroup consisting of all the nodes that are

823

descendants of any of the roots and ancestors of any of the heads.

835

descendants of any of the roots and ancestors of any of the heads.

824

Return a chunkbuffer object whose read() method will return

836

Return a chunkbuffer object whose read() method will return

825

successive changegroup chunks.

837

successive changegroup chunks.

826

838

827

It is fairly complex as determining which filenodes and which

839

It is fairly complex as determining which filenodes and which

828

manifest nodes need to be included for the changeset to be complete

840

manifest nodes need to be included for the changeset to be complete

829

is non-trivial.

841

is non-trivial.

830

842

831

Another wrinkle is doing the reverse, figuring out which changeset in

843

Another wrinkle is doing the reverse, figuring out which changeset in

832

the changegroup a particular filenode or manifestnode belongs to.

844

the changegroup a particular filenode or manifestnode belongs to.

833

"""

845

"""

834

cl = repo.changelog

846

cl = repo.changelog

835

if not roots:

847

if not roots:

836

roots = [nullid]

848

roots = [nullid]

837

discbases = []

849

discbases = []

838

for n in roots:

850

for n in roots:

839

discbases.extend([p for p in cl.parents(n) if p != nullid])

851

discbases.extend([p for p in cl.parents(n) if p != nullid])

840

# TODO: remove call to nodesbetween.

852

# TODO: remove call to nodesbetween.

841

csets, roots, heads = cl.nodesbetween(roots, heads)

853

csets, roots, heads = cl.nodesbetween(roots, heads)

842

included = set(csets)

854

included = set(csets)

843

discbases = [n for n in discbases if n not in included]

855

discbases = [n for n in discbases if n not in included]

844

outgoing = discovery.outgoing(cl, discbases, heads)

856

outgoing = discovery.outgoing(cl, discbases, heads)

845

bundler = packermap[version][0](repo)

857

bundler = packermap[version][0](repo)

846

return getsubset(repo, outgoing, bundler, source)

858

return getsubset(repo, outgoing, bundler, source)

847

859

848

def getlocalchangegroupraw(repo, source, outgoing, bundlecaps=None,

860

def getlocalchangegroupraw(repo, source, outgoing, bundlecaps=None,

849

version='01'):

861

version='01'):

850

"""Like getbundle, but taking a discovery.outgoing as an argument.

862

"""Like getbundle, but taking a discovery.outgoing as an argument.

851

863

852

This is only implemented for local repos and reuses potentially

864

This is only implemented for local repos and reuses potentially

853

precomputed sets in outgoing. Returns a raw changegroup generator."""

865

precomputed sets in outgoing. Returns a raw changegroup generator."""

854

if not outgoing.missing:

866

if not outgoing.missing:

855

return None

867

return None

856

bundler = packermap[version][0](repo, bundlecaps)

868

bundler = packermap[version][0](repo, bundlecaps)

857

return getsubsetraw(repo, outgoing, bundler, source)

869

return getsubsetraw(repo, outgoing, bundler, source)

858

870

859

def getlocalchangegroup(repo, source, outgoing, bundlecaps=None,

871

def getlocalchangegroup(repo, source, outgoing, bundlecaps=None,

860

version='01'):

872

version='01'):

861

"""Like getbundle, but taking a discovery.outgoing as an argument.

873

"""Like getbundle, but taking a discovery.outgoing as an argument.

862

874

863

This is only implemented for local repos and reuses potentially

875

This is only implemented for local repos and reuses potentially

864

precomputed sets in outgoing."""

876

precomputed sets in outgoing."""

865

if not outgoing.missing:

877

if not outgoing.missing:

866

return None

878

return None

867

bundler = packermap[version][0](repo, bundlecaps)

879

bundler = packermap[version][0](repo, bundlecaps)

868

return getsubset(repo, outgoing, bundler, source)

880

return getsubset(repo, outgoing, bundler, source)

869

881

870

def computeoutgoing(repo, heads, common):

882

def computeoutgoing(repo, heads, common):

871

"""Computes which revs are outgoing given a set of common

883

"""Computes which revs are outgoing given a set of common

872

and a set of heads.

884

and a set of heads.

873

885

874

This is a separate function so extensions can have access to

886

This is a separate function so extensions can have access to

875

the logic.

887

the logic.

876

888

877

Returns a discovery.outgoing object.

889

Returns a discovery.outgoing object.

878

"""

890

"""

879

cl = repo.changelog

891

cl = repo.changelog

880

if common:

892

if common:

881

hasnode = cl.hasnode

893

hasnode = cl.hasnode

882

common = [n for n in common if hasnode(n)]

894

common = [n for n in common if hasnode(n)]

883

else:

895

else:

884

common = [nullid]

896

common = [nullid]

885

if not heads:

897

if not heads:

886

heads = cl.heads()

898

heads = cl.heads()

887

return discovery.outgoing(cl, common, heads)

899

return discovery.outgoing(cl, common, heads)

888

900

889

def getchangegroup(repo, source, heads=None, common=None, bundlecaps=None,

901

def getchangegroup(repo, source, heads=None, common=None, bundlecaps=None,

890

version='01'):

902

version='01'):

891

"""Like changegroupsubset, but returns the set difference between the

903

"""Like changegroupsubset, but returns the set difference between the

892

ancestors of heads and the ancestors common.

904

ancestors of heads and the ancestors common.

893

905

894

If heads is None, use the local heads. If common is None, use [nullid].

906

If heads is None, use the local heads. If common is None, use [nullid].

895

907

896

The nodes in common might not all be known locally due to the way the

908

The nodes in common might not all be known locally due to the way the

897

current discovery protocol works.

909

current discovery protocol works.

898

"""

910

"""

899

outgoing = computeoutgoing(repo, heads, common)

911

outgoing = computeoutgoing(repo, heads, common)

900

return getlocalchangegroup(repo, source, outgoing, bundlecaps=bundlecaps,

912

return getlocalchangegroup(repo, source, outgoing, bundlecaps=bundlecaps,

901

version=version)

913

version=version)

902

914

903

def changegroup(repo, basenodes, source):

915

def changegroup(repo, basenodes, source):

904

# to avoid a race we use changegroupsubset() (issue1320)

916

# to avoid a race we use changegroupsubset() (issue1320)

905

return changegroupsubset(repo, basenodes, repo.heads(), source)

917

return changegroupsubset(repo, basenodes, repo.heads(), source)

906

918

907

def _addchangegroupfiles(repo, source, revmap, trp, pr, needfiles, wasempty):

919

def _addchangegroupfiles(repo, source, revmap, trp, pr, needfiles, wasempty):

908

revisions = 0

920

revisions = 0

909

files = 0

921

files = 0

910

while True:

922

while True:

911

chunkdata = source.filelogheader()

923

chunkdata = source.filelogheader()

912

if not chunkdata:

924

if not chunkdata:

913

break

925

break

914

f = chunkdata["filename"]

926

f = chunkdata["filename"]

915

repo.ui.debug("adding %s revisions\n" % f)

927

repo.ui.debug("adding %s revisions\n" % f)

916

pr()

928

pr()

917

fl = repo.file(f)

929

fl = repo.file(f)

918

o = len(fl)

930

o = len(fl)

919

try:

931

try:

920

if not fl.addgroup(source, revmap, trp):

932

if not fl.addgroup(source, revmap, trp):

921

raise error.Abort(_("received file revlog group is empty"))

933

raise error.Abort(_("received file revlog group is empty"))

922

except error.CensoredBaseError as e:

934

except error.CensoredBaseError as e:

923

raise error.Abort(_("received delta base is censored: %s") % e)

935

raise error.Abort(_("received delta base is censored: %s") % e)

924

revisions += len(fl) - o

936

revisions += len(fl) - o

925

files += 1

937

files += 1

926

if f in needfiles:

938

if f in needfiles:

927

needs = needfiles[f]

939

needs = needfiles[f]

928

for new in xrange(o, len(fl)):

940

for new in xrange(o, len(fl)):

929

n = fl.node(new)

941

n = fl.node(new)

930

if n in needs:

942

if n in needs:

931

needs.remove(n)

943

needs.remove(n)

932

else:

944

else:

933

raise error.Abort(

945

raise error.Abort(

934

_("received spurious file revlog entry"))

946

_("received spurious file revlog entry"))

935

if not needs:

947

if not needs:

936

del needfiles[f]

948

del needfiles[f]

937

repo.ui.progress(_('files'), None)

949

repo.ui.progress(_('files'), None)

938

950

939

for f, needs in needfiles.iteritems():

951

for f, needs in needfiles.iteritems():

940

fl = repo.file(f)

952

fl = repo.file(f)

941

for n in needs:

953

for n in needs:

942

try:

954

try:

943

fl.rev(n)

955

fl.rev(n)

944

except error.LookupError:

956

except error.LookupError:

945

raise error.Abort(

957

raise error.Abort(

946

_('missing file data for %s:%s - run hg verify') %

958

_('missing file data for %s:%s - run hg verify') %

947

(f, hex(n)))

959

(f, hex(n)))

948

960

949

return revisions, files

961

return revisions, files

	Site-wide shortcuts
/	Use quick search box
g h	Goto home page
g g	Goto my private gists page
g G	Goto my public gists page
g 0-9	Goto bookmarked items from 0-9
n r	New repository page
n g	New gist page

	Repositories
g s	Goto summary page
g c	Goto changelog page
g f	Goto files page
g F	Goto files page with file search activated
g p	Goto pull requests page
g o	Goto repository settings
g O	Goto repository access permissions settings
t s	Toggle sidebar on some pages

             # changegroup.py - Mercurial changegroup manipulation functions
             #
             #  Copyright 2006 Matt Mackall <mpm@selenic.com>
             #
             # This software may be used and distributed according to the terms of the
             # GNU General Public License version 2 or any later version.
             from __future__ import absolute_import
             import os
             import struct
             import tempfile
             import weakref
             from .i18n import _
             from .node import (
                 hex,
                 nullid,
                 nullrev,
                 short,
             )
             from . import (
                 branchmap,
                 dagutil,
                 discovery,
                 error,
                 mdiff,
                 phases,
                 util,
             )
             # struct format strings for the fixed-size header that precedes every delta
             # in a changegroup chunk. Each "20s" is one 20-byte string field.
             #
             # v1: four fields, unpacked by cg1unpacker._deltaheader as
             # (node, p1, p2, cs).
             _CHANGEGROUPV1_DELTA_HEADER = "20s20s20s20s"
             # v2: five fields, unpacked by cg2unpacker._deltaheader as
             # (node, p1, p2, deltabase, cs); the extra field is an explicit delta base.
             _CHANGEGROUPV2_DELTA_HEADER = "20s20s20s20s20s"
             def readexactly(stream, n):
                 '''Return exactly n bytes read from stream.

                 A single stream.read(n) call is made; if it hands back fewer than
                 n bytes, error.Abort is raised reporting both counts.
                 '''
                 data = stream.read(n)
                 got = len(data)
                 if got >= n:
                     return data
                 raise error.Abort(_("stream ended unexpectedly"
                                     " (got %d bytes, expected %d)")
                                   % (got, n))
             def getchunk(stream):
                 """Read one length-prefixed chunk from stream and return its payload.

                 The prefix is a 4-byte big-endian signed integer that counts itself,
                 so the payload is (length - 4) bytes. A zero length marks an empty
                 chunk and yields ""; any other length of 4 or less is rejected with
                 error.Abort.
                 """
                 prefix = readexactly(stream, 4)
                 (length,) = struct.unpack(">l", prefix)
                 if length > 4:
                     return readexactly(stream, length - 4)
                 if length:
                     raise error.Abort(_("invalid chunk length %d") % length)
                 return ""
             def chunkheader(length):
                 """Return the 4-byte header for a chunk carrying `length` payload bytes.

                 The encoded value includes the 4 bytes of the header itself.
                 """
                 framed = length + 4
                 return struct.pack(">l", framed)
             def closechunk():
                 """Return the header of a zero-length chunk (a packed 0).

                 getchunk() treats a length of 0 as an empty chunk.
                 """
                 terminator = struct.pack(">l", 0)
                 return terminator
             def combineresults(results):
                 """Combine 0 or more addchangegroup results into one.

                 Each entry of `results` is an integer in the convention documented
                 on cg1unpacker.apply(): 0 for "nothing changed", 1 for "head count
                 unchanged", 1+n for n added heads and -1-n for n removed heads.

                 Returns 0 as soon as any entry is 0. Otherwise the head deltas are
                 summed and re-encoded in the same convention; an empty `results`
                 yields 1.
                 """
                 changedheads = 0
                 for ret in results:
                     # If any changegroup result is 0, return 0. Returning right away
                     # keeps head changes accumulated from earlier entries from
                     # overriding the 0.
                     if ret == 0:
                         return 0
                     if ret < -1:
                         changedheads += ret + 1
                     elif ret > 1:
                         changedheads += ret - 1
                 if changedheads > 0:
                     return 1 + changedheads
                 if changedheads < 0:
                     return -1 + changedheads
                 return 1
             # Maps a bundle type name to a (header, compression key) pair. writebundle()
             # emits the header first and looks the compression key up in
             # util.compressors to compress the changegroup chunks that follow.
             bundletypes = {
                 "": ("", None),       # only when using unbundle on ssh and old http servers
                                       # since the unification ssh accepts a header but there
                                       # is no capability signaling it.
                 "HG20": (), # special-cased in writebundle(), which never unpacks this entry
                 "HG10UN": ("HG10UN", None),
                 # NOTE(review): the header here is "HG10", not "HG10BZ"; presumably the
                 # compressed stream itself supplies the leading "BZ" (cg1unpacker maps
                 # 'BZ' to a '_truncatedBZ' decompressor) -- confirm against util.
                 "HG10BZ": ("HG10", 'BZ'),
                 "HG10GZ": ("HG10GZ", 'GZ'),
             }
             # hgweb uses this list to communicate its preferred type
             bundlepriority = ['HG10GZ', 'HG10BZ', 'HG10UN']
             def writechunks(ui, chunks, filename, vfs=None):
                 """Write every item of chunks to a file and return the file's name.

                 When filename is given it is opened in "wb" mode, through vfs if one
                 is supplied and with the builtin open() otherwise. When filename is
                 empty, a temporary file named "hg-bundle-*.hg" is created instead.

                 If anything fails after the file has been opened, the file is
                 unlinked again before the exception propagates. ui is not used.
                 """
                 fh = None
                 pending = None  # path to remove if we do not finish writing
                 try:
                     if not filename:
                         fd, filename = tempfile.mkstemp(prefix="hg-bundle-", suffix=".hg")
                         fh = os.fdopen(fd, "wb")
                     elif vfs:
                         fh = vfs.open(filename, "wb")
                     else:
                         fh = open(filename, "wb")
                     pending = filename
                     for piece in chunks:
                         fh.write(piece)
                     # everything was written: keep the file
                     pending = None
                     return filename
                 finally:
                     if fh is not None:
                         fh.close()
                     if pending is not None:
                         remove = vfs.unlink if (filename and vfs) else os.unlink
                         remove(pending)
             def writebundle(ui, cg, filename, bundletype, vfs=None, compression=None):
                 """Write changegroup cg to a bundle file and return its filename.

                 bundletype selects the container:

                 - "HG20" wraps cg.getchunks() in a bundle2 'changegroup' part that
                   carries cg.version as its 'version' parameter; compression is
                   handed to the bundle2 bundler.
                 - any other key of bundletypes writes that entry's header followed
                   by the chunks run through the matching util.compressors entry.
                   Only version '01' changegroups are accepted here and compression
                   must be None.

                 The resulting chunk stream is handed to writechunks(), which picks a
                 temporary file when filename is empty and removes the file again if
                 writing fails.
                 """
                 if bundletype == "HG20":
                     from . import bundle2
                     bundler = bundle2.bundle20(ui)
                     bundler.setcompression(compression)
                     cgpart = bundler.newpart('changegroup', data=cg.getchunks())
                     cgpart.addparam('version', cg.version)
                     stream = bundler.getchunks()
                 else:
                     # compression argument is only for the bundle2 case
                     assert compression is None
                     if cg.version != '01':
                         raise error.Abort(_('old bundle types only supports v1 '
                                             'changegroups'))
                     header, comp = bundletypes[bundletype]
                     if comp not in util.compressors:
                         raise error.Abort(_('unknown stream compression type: %s')
                                           % comp)
                     compressor = util.compressors[comp]()
                     rawchunks = cg.getchunks()
                     def compressed():
                         # header goes out as is; only the changegroup is compressed
                         yield header
                         for raw in rawchunks:
                             yield compressor.compress(raw)
                         yield compressor.flush()
                     stream = compressed()
                 # cg.getchunks() walks the changegroup structure, so the stream ends
                 # where the changegroup ends rather than at end-of-file of the source.
                 return writechunks(ui, stream, filename, vfs=vfs)
             class cg1unpacker(object):
                 """Unpacker for cg1 changegroup streams.

                 A changegroup unpacker handles the framing of the revision data in
                 the wire format. Most consumers will want to use the apply()
                 method to add the changes from the changegroup to a repository.

                 If you're forwarding a changegroup unmodified to another consumer,
                 use getchunks(), which returns an iterator of changegroup
                 chunks. This is mostly useful for cases where you need to know the
                 data stream has ended by observing the end of the changegroup.

                 deltachunk() is useful only if you're applying delta data. Most
                 consumers should prefer apply() instead.

                 A few other public methods exist. Those are used only for
                 bundlerepo and some debug commands - their use is discouraged.
                 """
                 # struct format and byte size of the per-delta header; subclasses
                 # override both together with _deltaheader().
                 deltaheader = _CHANGEGROUPV1_DELTA_HEADER
                 deltaheadersize = struct.calcsize(deltaheader)
                 version = '01'
                 def __init__(self, fh, alg):
                     """Wrap file object fh, decompressing it according to alg.

                     alg is a key of util.decompressors; 'UN' is accepted as an alias
                     for None. error.Abort is raised for any other unknown key.
                     """
                     if alg == 'UN':
                         alg = None # get more modern without breaking too much
                     if not alg in util.decompressors:
                         raise error.Abort(_('unknown stream compression type: %s')
                                          % alg)
                     # the membership check above runs on 'BZ' itself; only afterwards
                     # is it swapped for the '_truncatedBZ' decompressor
                     if alg == 'BZ':
                         alg = '_truncatedBZ'
                     self._stream = util.decompressors[alg](fh)
                     self._type = alg
                     # optional zero-argument callable invoked by _chunklength() for
                     # every non-empty chunk; apply() uses it to report progress
                     self.callback = None
                 # These methods (compressed, read, seek, tell) all appear to only
                 # be used by bundlerepo, but it's a little hard to tell.
                 def compressed(self):
                     """Return True unless the stream was opened with no compression."""
                     return self._type is not None
                 def read(self, l):
                     """Read l bytes from the decompressed stream."""
                     return self._stream.read(l)
                 def seek(self, pos):
                     """Delegate to the underlying stream's seek()."""
                     return self._stream.seek(pos)
                 def tell(self):
                     """Delegate to the underlying stream's tell()."""
                     return self._stream.tell()
                 def close(self):
                     """Delegate to the underlying stream's close()."""
                     return self._stream.close()
                 def _chunklength(self):
                     """Read a chunk header and return the payload length that follows.

                     Returns 0 for an empty chunk (encoded length 0). Any other encoded
                     length of 4 or less raises error.Abort. For non-empty chunks the
                     callback, if set, is invoked before returning.
                     """
                     d = readexactly(self._stream, 4)
                     l = struct.unpack(">l", d)[0]
                     if l <= 4:
                         if l:
                             raise error.Abort(_("invalid chunk length %d") % l)
                         return 0
                     if self.callback:
                         self.callback()
                     # the encoded length counts the 4 header bytes themselves
                     return l - 4
                 def changelogheader(self):
                     """v10 does not have a changelog header chunk"""
                     return {}
                 def manifestheader(self):
                     """v10 does not have a manifest header chunk"""
                     return {}
                 def filelogheader(self):
                     """return the header of the filelogs chunk, v10 only has the filename

                     An empty dict is returned when the chunk is empty.
                     """
                     l = self._chunklength()
                     if not l:
                         return {}
                     fname = readexactly(self._stream, l)
                     return {'filename': fname}
                 def _deltaheader(self, headertuple, prevnode):
                     """Expand an unpacked v1 header to (node, p1, p2, deltabase, cs).

                     The v1 header has no delta base field: the base is p1 when
                     prevnode is None, and prevnode otherwise.
                     """
                     node, p1, p2, cs = headertuple
                     if prevnode is None:
                         deltabase = p1
                     else:
                         deltabase = prevnode
                     return node, p1, p2, deltabase, cs
                 def deltachunk(self, prevnode):
                     """Read the next delta chunk and return it as a dict.

                     The dict has the keys 'node', 'p1', 'p2', 'cs', 'deltabase' and
                     'delta'. An empty dict is returned for an empty chunk. prevnode is
                     forwarded to _deltaheader() to resolve the delta base.
                     """
                     l = self._chunklength()
                     if not l:
                         return {}
                     headerdata = readexactly(self._stream, self.deltaheadersize)
                     header = struct.unpack(self.deltaheader, headerdata)
                     # whatever follows the fixed-size header is the delta itself
                     delta = readexactly(self._stream, l - self.deltaheadersize)
                     node, p1, p2, deltabase, cs = self._deltaheader(header, prevnode)
                     return {'node': node, 'p1': p1, 'p2': p2, 'cs': cs,
                             'deltabase': deltabase, 'delta': delta}
                 def getchunks(self):
                     """Yield all the chunks contained in the bundle.

                     Used when you need to forward the binary stream to a file or another
                     network API. To do so, it parses the changegroup data; otherwise it
                     would block in case of sshrepo because it would not know where the
                     stream ends.
                     """
                     # an empty chunkgroup is the end of the changegroup
                     # a changegroup has at least 2 chunkgroups (changelog and manifest).
                     # after that, an empty chunkgroup is the end of the changegroup
                     #
                     # `count <= 2` is tested before count is incremented, so the outer
                     # loop always runs for three groups and then continues only while
                     # the group just read was non-empty.
                     empty = False
                     count = 0
                     while not empty or count <= 2:
                         empty = True
                         count += 1
                         while True:
                             # self is passed as the stream: getchunk() only needs read()
                             chunk = getchunk(self)
                             if not chunk:
                                 break
                             empty = False
                             yield chunkheader(len(chunk))
                             # hand the payload out in slices of at most 2**20 bytes
                             pos = 0
                             while pos < len(chunk):
                                 next = pos + 2**20
                                 yield chunk[pos:next]
                                 pos = next
                         yield closechunk()
                 def _unpackmanifests(self, repo, revmap, trp, prog, numchanges):
                     """Add the manifest group of the stream to repo.manifest.

                     prog is called as prog(step, total) to build the progress callback;
                     numchanges is used as the progress total.
                     """
                     # We know that we'll never have more manifests than we had
                     # changesets.
                     self.callback = prog(_('manifests'), numchanges)
                     # no need to check for empty manifest group here:
                     # if the result of the merge of 1 and 2 is the same in 3 and 4,
                     # no new manifest will be created and the manifest group will
                     # be empty during the pull
                     self.manifestheader()
                     repo.manifest.addgroup(self, revmap, trp)
                     repo.ui.progress(_('manifests'), None)
                 def apply(self, repo, srctype, url, emptyok=False,
                           targetphase=phases.draft, expectedtotal=None):
                     """Add the changegroup returned by source.read() to this repo.

                     srctype is a string like 'push', 'pull', or 'unbundle'.  url is
                     the URL of the repo where this changegroup is coming from.

                     emptyok allows the changelog group to be empty; otherwise an
                     empty group raises error.Abort. targetphase is the phase passed to
                     phases.retractboundary() for the added changesets when srctype is
                     none of 'push', 'serve' or 'strip'. expectedtotal is used as the
                     total of the 'changesets' progress bar.

                     Return an integer summarizing the change to this repo:
                     - nothing changed or no source: 0
                     - more heads than before: 1+added heads (2..n)
                     - fewer heads than before: -1-removed heads (-2..-n)
                     - number of heads stays the same: 1
                     """
                     # NOTE(review): the docstring lists 0 as a possible result, but the
                     # return statements at the end of this method never produce 0.
                     repo = repo.unfiltered()
                     wasempty = (len(repo.changelog) == 0)
                     # csmap and revmap close over `cl`, which is only bound inside the
                     # try block below; they are not called before that point.
                     def csmap(x):
                         repo.ui.debug("add changeset %s\n" % short(x))
                         return len(cl)
                     def revmap(x):
                         return cl.rev(x)
                     changesets = files = revisions = 0
                     tr = repo.transaction("\n".join([srctype, util.hidepassword(url)]))
                     try:
                         # The transaction could have been created before and already
                         # carries source information. In this case we use the top
                         # level data. We overwrite the argument because we need to use
                         # the top level value (if they exist) in this function.
                         srctype = tr.hookargs.setdefault('source', srctype)
                         url = tr.hookargs.setdefault('url', url)
                         repo.hook('prechangegroup', throw=True, **tr.hookargs)
                         # write changelog data to temp files so concurrent readers
                         # will not see an inconsistent view
                         cl = repo.changelog
                         cl.delayupdate(tr)
                         oldheads = cl.heads()
                         # hand the revlogs a weak proxy rather than the transaction itself
                         trp = weakref.proxy(tr)
                         # pull off the changeset group
                         repo.ui.status(_("adding changesets\n"))
                         clstart = len(cl)
                         # progress reporter: each call reports the next count for `step`
                         class prog(object):
                             def __init__(self, step, total):
                                 self._step = step
                                 self._total = total
                                 self._count = 1
                             def __call__(self):
                                 repo.ui.progress(self._step, self._count, unit=_('chunks'),
                                                  total=self._total)
                                 self._count += 1
                         self.callback = prog(_('changesets'), expectedtotal)
                         # names of the files touched by the incoming changesets
                         efiles = set()
                         def onchangelog(cl, node):
                             efiles.update(cl.read(node)[3])
                         self.changelogheader()
                         srccontent = cl.addgroup(self, csmap, trp,
                                                  addrevisioncb=onchangelog)
                         # from here on only the number of touched files is needed
                         efiles = len(efiles)
                         if not (srccontent or emptyok):
                             raise error.Abort(_("received changelog group is empty"))
                         clend = len(cl)
                         changesets = clend - clstart
                         repo.ui.progress(_('changesets'), None)
                         # pull off the manifest group
                         repo.ui.status(_("adding manifests\n"))
                         self._unpackmanifests(repo, revmap, trp, prog, changesets)
                         # filename -> set of file nodes that must show up in the file
                         # groups; only filled in when server.validate is enabled
                         needfiles = {}
                         if repo.ui.configbool('server', 'validate', default=False):
                             # validate incoming csets have their manifests
                             for cset in xrange(clstart, clend):
                                 mfnode = repo.changelog.read(repo.changelog.node(cset))[0]
                                 mfest = repo.manifest.readdelta(mfnode)
                                 # store file nodes we must see
                                 for f, n in mfest.iteritems():
                                     needfiles.setdefault(f, set()).add(n)
                         # process the files
                         repo.ui.status(_("adding file changes\n"))
                         # file progress is driven explicitly through `pr`, not per chunk
                         self.callback = None
                         pr = prog(_('files'), efiles)
                         newrevs, newfiles = _addchangegroupfiles(
                             repo, self, revmap, trp, pr, needfiles, wasempty)
                         revisions += newrevs
                         files += newfiles
                         # dh: change in the number of heads; new heads that close
                         # their branch are not counted
                         dh = 0
                         if oldheads:
                             heads = cl.heads()
                             dh = len(heads) - len(oldheads)
                             for h in heads:
                                 if h not in oldheads and repo[h].closesbranch():
                                     dh -= 1
                         htext = ""
                         if dh:
                             htext = _(" (%+d heads)") % dh
                         repo.ui.status(_("added %d changesets"
                                          " with %d changes to %d files%s\n")
                                          % (changesets, revisions, files, htext))
                         repo.invalidatevolatilesets()
                         if changesets > 0:
                             # hooks always see the first added changeset as 'node'; a
                             # 'node' already present on the transaction is left alone
                             # and only overridden in the local copy
                             if 'node' not in tr.hookargs:
                                 tr.hookargs['node'] = hex(cl.node(clstart))
                                 hookargs = dict(tr.hookargs)
                             else:
                                 hookargs = dict(tr.hookargs)
                                 hookargs['node'] = hex(cl.node(clstart))
                             repo.hook('pretxnchangegroup', throw=True, **hookargs)
                         added = [cl.node(r) for r in xrange(clstart, clend)]
                         publishing = repo.publishing()
                         if srctype in ('push', 'serve'):
                             # Old servers can not push the boundary themselves.
                             # New servers won't push the boundary if changeset already
                             # exists locally as secret
                             #
                             # We should not use added here but the list of all change in
                             # the bundle
                             if publishing:
                                 phases.advanceboundary(repo, tr, phases.public, srccontent)
                             else:
                                 # Those changesets have been pushed from the outside, their
                                 # phases are going to be pushed alongside. Therefore
                                 # `targetphase` is ignored.
                                 phases.advanceboundary(repo, tr, phases.draft, srccontent)
                                 phases.retractboundary(repo, tr, phases.draft, added)
                         elif srctype != 'strip':
                             # publishing only alter behavior during push
                             #
                             # strip should not touch boundary at all
                             phases.retractboundary(repo, tr, targetphase, added)
                         if changesets > 0:
                             if srctype != 'strip':
                                 # During strip, branchcache is invalid but coming call to
                                 # `destroyed` will repair it.
                                 # In other case we can safely update cache on disk.
                                 branchmap.updatecache(repo.filtered('served'))
                             def runhooks():
                                 # These hooks run when the lock releases, not when the
                                 # transaction closes. So it's possible for the changelog
                                 # to have changed since we last saw it.
                                 if clstart >= len(repo):
                                     return
                                 # forcefully update the on-disk branch cache
                                 # NOTE(review): only the debug message is emitted here; no
                                 # cache update call is visible in this function.
                                 repo.ui.debug("updating the branch cache\n")
                                 repo.hook("changegroup", **hookargs)
                                 for n in added:
                                     args = hookargs.copy()
                                     args['node'] = hex(n)
                                     repo.hook("incoming", **args)
                                 newheads = [h for h in repo.heads() if h not in oldheads]
                                 repo.ui.log("incoming",
                                             "%s incoming changes - new heads: %s\n",
                                             len(added),
                                             ', '.join([hex(c[:6]) for c in newheads]))
                             # the post-close callback defers runhooks via repo._afterlock
                             tr.addpostclose('changegroup-runhooks-%020i' % clstart,
                                             lambda tr: repo._afterlock(runhooks))
                         tr.close()
                     finally:
                         tr.release()
                         repo.ui.flush()
                     # never return 0 here:
                     if dh < 0:
                         return dh - 1
                     else:
                         return dh + 1
             class cg2unpacker(cg1unpacker):
                 """Unpacker for cg2 changegroup streams.

                 The only difference from cg1 is the delta header: it carries five
                 fields instead of four, the additional one being an explicit delta
                 base. Everything else is inherited from cg1unpacker.
                 """
                 version = '02'
                 deltaheader = _CHANGEGROUPV2_DELTA_HEADER
                 deltaheadersize = struct.calcsize(deltaheader)
                 def _deltaheader(self, headertuple, prevnode):
                     # the header already names its delta base, so prevnode is unused
                     (node, p1, p2, deltabase, cs) = headertuple
                     return (node, p1, p2, deltabase, cs)
             class headerlessfixup(object):
                 """File-like reader that serves the bytes h before the content of fh.

                 read(n) is answered from h while any of it is left, topping the
                 result up from fh when h runs short; once h is used up every read
                 goes to fh through readexactly().
                 """
                 def __init__(self, fh, h):
                     self._fh = fh
                     self._h = h
                 def read(self, n):
                     if not self._h:
                         return readexactly(self._fh, n)
                     buffered = self._h[:n]
                     self._h = self._h[n:]
                     missing = n - len(buffered)
                     if missing > 0:
                         buffered += readexactly(self._fh, missing)
                     return buffered
             class cg1packer(object):
                 deltaheader = _CHANGEGROUPV1_DELTA_HEADER
                 version = '01'
                 def __init__(self, repo, bundlecaps=None):
                     """Build a bundler that reads from repo.

                     bundlecaps is the optional set of capabilities that may be used
                     to build the bundle; it defaults to an empty set.
                     """
                     # Set of capabilities we can use to build the bundle.
                     self._bundlecaps = set() if bundlecaps is None else bundlecaps
                     # experimental config: bundle.reorder
                     # 'auto' is stored as None; anything else goes through parsebool
                     setting = repo.ui.config('bundle', 'reorder', 'auto')
                     reorder = None if setting == 'auto' else util.parsebool(setting)
                     self._repo = repo
                     self._reorder = reorder
                     self._progress = repo.ui.progress
                     ui = self._repo.ui
                     # size notes are only shown for --verbose without --debug
                     if ui.verbose and not ui.debugflag:
                         self._verbosenote = ui.note
                     else:
                         self._verbosenote = lambda s: None
                 def close(self):
                     """Return the chunk that terminates a group (see closechunk())."""
                     terminator = closechunk()
                     return terminator
                 def fileheader(self, fname):
                     """Return fname framed as a chunk: length header, then the name."""
                     header = chunkheader(len(fname))
                     return header + fname
                 def group(self, nodelist, revlog, lookup, units=None):
                     """Yield the changegroup chunks (strings) of a delta group.

                     nodelist holds the nodes of revlog to send. They are turned into
                     revision numbers and ordered: linearized through dagutil when
                     reordering is in effect, sorted numerically otherwise. The first
                     parent of the first revision is then put in front, and one delta
                     per consecutive pair is emitted through self.revchunk(). The
                     receiver is expected to have that first parent already; when it
                     is nullrev the group starts with a full revision.

                     lookup maps each node to the linknode passed to revchunk().

                     If units is not None, progress is reported with units naming the
                     kind of revlog being walked (changelog, manifest, etc.).

                     The group always ends with the chunk returned by self.close().
                     """
                     # if we don't have any revisions touched by these changesets, bail
                     if len(nodelist) == 0:
                         yield self.close()
                         return
                     torev = revlog.rev
                     # for generaldelta revlogs, we linearize the revs; this will both be
                     # much quicker and generate a much smaller bundle
                     if (revlog._generaldelta and self._reorder is None) or self._reorder:
                         dag = dagutil.revlogdag(revlog)
                         revs = dag.linearize(set(torev(n) for n in nodelist))
                     else:
                         revs = sorted([torev(n) for n in nodelist])
                     # the first delta is computed against the first rev's first parent
                     revs.insert(0, revlog.parentrevs(revs[0])[0])
                     # build deltas
                     total = len(revs) - 1
                     msgbundling = _('bundling')
                     for idx in xrange(total):
                         if units is not None:
                             self._progress(msgbundling, idx + 1, unit=units, total=total)
                         prev = revs[idx]
                         curr = revs[idx + 1]
                         linknode = lookup(revlog.node(curr))
                         for piece in self.revchunk(revlog, curr, prev, linknode):
                             yield piece
                     if units is not None:
                         self._progress(msgbundling, None)
                     yield self.close()
                 # filter any nodes that claim to be part of the known set
                 def prune(self, revlog, missing, commonrevs):
                     """Return the nodes of missing whose linkrev is not in commonrevs.

                     The input order is preserved.
                     """
                     torev, tolinkrev = revlog.rev, revlog.linkrev
                     kept = []
                     for node in missing:
                         if tolinkrev(torev(node)) not in commonrevs:
                             kept.append(node)
                     return kept
                 def _packmanifests(self, mfnodes, lookuplinknode):
                     """Yield the chunks of the manifest group for mfnodes.

                     The chunks come from group() run over the repository's manifest
                     revlog. Once the group is exhausted, the total number of bytes
                     yielded is reported through the verbose note.
                     """
                     total = 0
                     manifestlog = self._repo.manifest
                     chunks = self.group(mfnodes, manifestlog, lookuplinknode,
                                         units=_('manifests'))
                     for piece in chunks:
                         total += len(piece)
                         yield piece
                     self._verbosenote(_('%8.i (manifests)\n') % total)
                 def generate(self, commonrevs, clnodes, fastpathlinkrev, source):
                     '''yield a sequence of changegroup chunks (strings)

                     The stream consists of the changelog group for ``clnodes``, the
                     manifest group, the per-file groups from generatefiles() and a
                     final closing chunk.  ``commonrevs`` is used to prune manifests
                     and file nodes; ``source`` is forwarded to generatefiles() and
                     to the 'outgoing' hook, which fires after the last chunk when
                     ``clnodes`` is not empty.

                     ``fastpathlinkrev`` asks for file linknodes to be derived from
                     the filelogs' own linkrevs; it is ignored when reordering is
                     enabled.
                     '''
                     repo = self._repo
                     cl = repo.changelog
                     ml = repo.manifest

                     clrevorder = {}
                     mfs = {} # needed manifests
                     fnodes = {} # needed file nodes
                     changedfiles = set()

                     # Callback for the changelog, used to collect changed files and manifest
                     # nodes.
                     # Returns the linkrev node (identity in the changelog case).
                     def lookupcl(x):
                         c = cl.read(x)
                         clrevorder[x] = len(clrevorder)
                         changedfiles.update(c[3])
                         # record the first changeset introducing this manifest version
                         mfs.setdefault(c[0], x)
                         return x

                     self._verbosenote(_('uncompressed size of bundle content:\n'))
                     size = 0
                     for chunk in self.group(clnodes, cl, lookupcl, units=_('changesets')):
                         size += len(chunk)
                         yield chunk
                     self._verbosenote(_('%8.i (changelog)\n') % size)

                     # We need to make sure that the linkrev in the changegroup refers to
                     # the first changeset that introduced the manifest or file revision.
                     # The fastpath is usually safer than the slowpath, because the filelogs
                     # are walked in revlog order.
                     #
                     # When taking the slowpath with reorder=None and the manifest revlog
                     # uses generaldelta, the manifest may be walked in the "wrong" order.
                     # Without 'clrevorder', we would get an incorrect linkrev (see fix in
                     # cc0ff93d0c0c).
                     #
                     # When taking the fastpath, we are only vulnerable to reordering
                     # of the changelog itself. The changelog never uses generaldelta, so
                     # it is only reordered when reorder=True. To handle this case, we
                     # simply take the slowpath, which already has the 'clrevorder' logic.
                     # This was also fixed in cc0ff93d0c0c.
                     fastpathlinkrev = fastpathlinkrev and not self._reorder

                     # Callback for the manifest, used to collect linkrevs for filelog
                     # revisions.
                     # Returns the linkrev node (collected in lookupcl).
                     def lookupmflinknode(x):
                         """Callback for looking up the linknode for manifests.

                         Returns the linkrev node for the specified manifest.

                         SIDE EFFECT:

                           fnodes gets populated with the relevant file nodes
                           (and their linknodes) if we're not using
                           fastpathlinkrev.

                         Note that this means you can't trust fnodes until
                         after manifests have been sent to the client.
                         """
                         clnode = mfs[x]
                         if not fastpathlinkrev:
                             mdata = ml.readfast(x)
                             for f, n in mdata.iteritems():
                                 if f in changedfiles:
                                     # record the first changeset introducing this filelog
                                     # version
                                     fclnodes = fnodes.setdefault(f, {})
                                     fclnode = fclnodes.setdefault(n, clnode)
                                     if clrevorder[clnode] < clrevorder[fclnode]:
                                         fclnodes[n] = clnode
                         return clnode

                     mfnodes = self.prune(ml, mfs, commonrevs)
                     for x in self._packmanifests(mfnodes, lookupmflinknode):
                         yield x

                     # the manifest -> changeset map is no longer needed once the
                     # manifest group has been emitted
                     mfs.clear()
                     clrevs = set(cl.rev(x) for x in clnodes)

                     def linknodes(filerevlog, fname):
                         # fastpath: read linkrevs straight from the filelog, keeping
                         # only revisions linked to a changeset being bundled
                         if fastpathlinkrev:
                             llr = filerevlog.linkrev
                             def genfilenodes():
                                 for r in filerevlog:
                                     linkrev = llr(r)
                                     if linkrev in clrevs:
                                         yield filerevlog.node(r), cl.node(linkrev)
                             return dict(genfilenodes())
                         # slowpath: use what lookupmflinknode collected
                         return fnodes.get(fname, {})

                     for chunk in self.generatefiles(changedfiles, linknodes, commonrevs,
                                                     source):
                         yield chunk

                     yield self.close()

                     if clnodes:
                         repo.hook('outgoing', node=hex(clnodes[0]), source=source)
                 # The 'source' parameter is useful for extensions
                 def generatefiles(self, changedfiles, linknodes, commonrevs, source):
                     """Yield changegroup chunks for every file in ``changedfiles``.

                     Files are visited in sorted name order.  For each one,
                     ``linknodes(filerevlog, fname)`` supplies a mapping from file node
                     to linknode; the nodes that survive ``prune()`` are emitted as a
                     file header followed by the chunks from ``group()``.  Files with
                     nothing left to send produce no output.  ``source`` is not read
                     here.

                     Raises error.Abort when a file's revlog is empty or missing.
                     """
                     repo = self._repo
                     report = self._progress
                     topic = _('bundling')
                     nfiles = len(changedfiles)
                     # unit label for progress output
                     unitfiles = _('files')
                     for pos, fname in enumerate(sorted(changedfiles), 1):
                         flog = repo.file(fname)
                         if not flog:
                             raise error.Abort(_("empty or missing revlog for %s") % fname)

                         nodemap = linknodes(flog, fname)

                         # Linknode lookup for group(): the mapping was built by the
                         # linknodes callback just above.
                         def linknodeof(fnode):
                             return nodemap[fnode]

                         tosend = self.prune(flog, nodemap, commonrevs)
                         if not tosend:
                             continue

                         report(topic, pos, item=fname, unit=unitfiles, total=nfiles)
                         header = self.fileheader(fname)
                         sent = len(header)
                         yield header
                         for piece in self.group(tosend, flog, linknodeof):
                             sent += len(piece)
                             yield piece
                         self._verbosenote(_('%8.i  %s\n') % (sent, fname))
                     report(topic, None)
                 def deltaparent(self, revlog, rev, p1, p2, prev):
                     """Return the revision that ``rev`` should be deltaed against.

                     This implementation always answers ``prev``, the revision handed
                     in by the caller; the other arguments are ignored.
                     """
                     deltabase = prev
                     return deltabase
                 def revchunk(self, revlog, rev, prev, linknode):
                     """Yield the pieces of the changegroup chunk for ``rev``.

                     Three strings are produced in order: the chunk header carrying
                     the combined length, the delta header (followed by any diff
                     header prefix), and the delta payload.  The delta base is chosen
                     by ``self.deltaparent()``.
                     """
                     node = revlog.node(rev)
                     parent1, parent2 = revlog.parentrevs(rev)
                     base = self.deltaparent(revlog, rev, parent1, parent2, prev)

                     diffheader = ''
                     if revlog.iscensored(base) or revlog.iscensored(rev):
                         # either side is censored: send the full text (or its
                         # tombstone) instead of asking the revlog for a revdiff
                         try:
                             payload = revlog.revision(node)
                         except error.CensoredNodeError as e:
                             payload = e.tombstone
                         if base == nullrev:
                             diffheader = mdiff.trivialdiffheader(len(payload))
                         else:
                             diffheader = mdiff.replacediffheader(revlog.rawsize(base),
                                                                  len(payload))
                     elif base == nullrev:
                         # no base to diff against: send the full revision
                         payload = revlog.revision(node)
                         diffheader = mdiff.trivialdiffheader(len(payload))
                     else:
                         payload = revlog.revdiff(base, rev)

                     p1n, p2n = revlog.parents(node)
                     header = self.builddeltaheader(node, p1n, p2n, revlog.node(base),
                                                    linknode)
                     header += diffheader
                     yield chunkheader(len(header) + len(payload))
                     yield header
                     yield payload
                 def builddeltaheader(self, node, p1n, p2n, basenode, linknode):
                     """Pack the delta header fields with the ``self.deltaheader`` format.

                     ``basenode`` is deliberately left out: in HG10 the delta base is
                     implicitly the previous revision.
                     """
                     fields = (node, p1n, p2n, linknode)
                     return struct.pack(self.deltaheader, *fields)
             class cg2packer(cg1packer):
                 """Packer for changegroup version '02'.

                 Compared with cg1packer, the delta header also carries the delta
                 base node, and the revlog's own delta parent is used as the base
                 when it is one of p1, p2 or the previous revision.
                 """
                 version = '02'
                 deltaheader = _CHANGEGROUPV2_DELTA_HEADER

                 def __init__(self, repo, bundlecaps=None):
                     super(cg2packer, self).__init__(repo, bundlecaps)
                     # Since generaldelta is directly supported by cg2, reordering
                     # generally doesn't help, so it is off by default (treating
                     # bundle.reorder=auto just like bundle.reorder=False).
                     if self._reorder is None:
                         self._reorder = False

                 def deltaparent(self, revlog, rev, p1, p2, prev):
                     """Return the revision to use as delta base for ``rev``."""
                     candidate = revlog.deltaparent(rev)
                     if candidate == nullrev:
                         # avoid storing full revisions; pick prev in those cases
                         return prev
                     if candidate not in (p1, p2, prev):
                         # also pick prev when we can't be sure remote has the
                         # revlog's delta parent
                         return prev
                     return candidate

                 def builddeltaheader(self, node, p1n, p2n, basenode, linknode):
                     """Pack the delta header, including the explicit base node."""
                     fields = (node, p1n, p2n, basenode, linknode)
                     return struct.pack(self.deltaheader, *fields)
             # changegroup version -> (packer class, unpacker class)
             packermap = {
                 '01': (cg1packer, cg1unpacker),
                 # cg2 adds support for exchanging generaldelta
                 '02': (cg2packer, cg2unpacker),
             }
             def _changegroupinfo(repo, nodes, source):
                 """Report the changesets in ``nodes`` through ``repo.ui``.

                 The count is printed when the ui is verbose or ``source`` is
                 'bundle'.  With the debug flag set, every node is also listed in
                 hex form.
                 """
                 ui = repo.ui
                 if ui.verbose or source == 'bundle':
                     ui.status(_("%d changesets found\n") % len(nodes))
                 if not ui.debugflag:
                     return
                 ui.debug("list of changesets:\n")
                 for changeset in nodes:
                     ui.debug("%s\n" % hex(changeset))
             def getsubsetraw(repo, outgoing, bundler, source, fastpath=False):
                 """Return the chunk iterator from ``bundler.generate()`` for ``outgoing``.

                 Works on the unfiltered repo.  Before generating, the
                 'preoutgoing' hook is fired with throw=True and the outgoing
                 changesets are reported via _changegroupinfo().

                 ``fastpath`` forces the linkrev fast path; otherwise it is taken
                 only when the requested heads equal the repo heads.
                 """
                 repo = repo.unfiltered()
                 commonrevs = outgoing.common
                 csets = outgoing.missing
                 # Sort a copy: the list belongs to ``outgoing``, which the caller
                 # may keep using, so it must not be reordered in place here.
                 heads = sorted(outgoing.missingheads)
                 # We go through the fast path if we get told to, or if all
                 # (unfiltered) heads have been requested (since we then know that
                 # all linkrevs will be pulled by the client).
                 fastpathlinkrev = fastpath or (
                         repo.filtername is None and heads == sorted(repo.heads()))

                 repo.hook('preoutgoing', throw=True, source=source)
                 _changegroupinfo(repo, csets, source)
                 return bundler.generate(commonrevs, csets, fastpathlinkrev, source)
             def getsubset(repo, outgoing, bundler, source, fastpath=False):
                 """Like getsubsetraw(), but wrap the raw chunks in an unpacker.

                 The unpacker class registered in ``packermap`` for
                 ``bundler.version`` is instantiated over a util.chunkbuffer of
                 the raw chunks, with None as its second argument.
                 """
                 rawchunks = getsubsetraw(repo, outgoing, bundler, source, fastpath)
                 unpackercls = packermap[bundler.version][1]
                 return unpackercls(util.chunkbuffer(rawchunks), None)
             def changegroupsubset(repo, roots, heads, source, version='01'):
                 """Compute a changegroup for the changesets between roots and heads.

                 The changegroup consists of all the nodes that are descendants of
                 any of the roots and ancestors of any of the heads.  An empty
                 ``roots`` is treated as [nullid].

                 It is fairly complex as determining which filenodes and which
                 manifest nodes need to be included for the changeset to be complete
                 is non-trivial.

                 Another wrinkle is doing the reverse, figuring out which changeset in
                 the changegroup a particular filenode or manifestnode belongs to.

                 Returns whatever getsubset() produces with the packer registered
                 under ``version``.
                 """
                 cl = repo.changelog
                 if not roots:
                     roots = [nullid]
                 # non-null parents of the requested roots are the candidate bases
                 rootparents = [p for n in roots
                                for p in cl.parents(n) if p != nullid]
                 # TODO: remove call to nodesbetween.
                 csets, roots, heads = cl.nodesbetween(roots, heads)
                 included = set(csets)
                 discbases = [n for n in rootparents if n not in included]
                 outgoing = discovery.outgoing(cl, discbases, heads)
                 packercls = packermap[version][0]
                 return getsubset(repo, outgoing, packercls(repo), source)
             def getlocalchangegroupraw(repo, source, outgoing, bundlecaps=None,
                                        version='01'):
                 """Like getbundle, but taking a discovery.outgoing as an argument.

                 This is only implemented for local repos and reuses potentially
                 precomputed sets in outgoing.  Returns None when ``outgoing`` has
                 nothing missing, otherwise the raw changegroup generator obtained
                 from getsubsetraw().
                 """
                 if outgoing.missing:
                     packercls = packermap[version][0]
                     bundler = packercls(repo, bundlecaps)
                     return getsubsetraw(repo, outgoing, bundler, source)
                 return None
             def getlocalchangegroup(repo, source, outgoing, bundlecaps=None,
                                     version='01'):
                 """Like getbundle, but taking a discovery.outgoing as an argument.

                 This is only implemented for local repos and reuses potentially
                 precomputed sets in outgoing.  Returns None when ``outgoing`` has
                 nothing missing, otherwise the result of getsubset().
                 """
                 if outgoing.missing:
                     packercls = packermap[version][0]
                     bundler = packercls(repo, bundlecaps)
                     return getsubset(repo, outgoing, bundler, source)
                 return None
             def computeoutgoing(repo, heads, common):
                 """Compute which revs are outgoing given common nodes and heads.

                 Nodes of ``common`` unknown to the changelog are discarded; an
                 empty ``common`` becomes [nullid] and empty ``heads`` become the
                 changelog heads.

                 This is a separate function so extensions can have access to
                 the logic.

                 Returns a discovery.outgoing object.
                 """
                 cl = repo.changelog
                 if not common:
                     common = [nullid]
                 else:
                     known = cl.hasnode
                     common = [node for node in common if known(node)]
                 if not heads:
                     heads = cl.heads()
                 return discovery.outgoing(cl, common, heads)
             def getchangegroup(repo, source, heads=None, common=None, bundlecaps=None,
                                version='01'):
                 """Like changegroupsubset, but returns the set difference between the
                 ancestors of heads and the ancestors common.

                 If heads is None, use the local heads. If common is None, use [nullid].

                 The nodes in common might not all be known locally due to the way the
                 current discovery protocol works.  The outgoing set is computed by
                 computeoutgoing() and passed on to getlocalchangegroup().
                 """
                 missing = computeoutgoing(repo, heads, common)
                 return getlocalchangegroup(repo, source, missing,
                                            bundlecaps=bundlecaps, version=version)
             def changegroup(repo, basenodes, source):
                 """Return the changegroup from ``basenodes`` up to the repo heads."""
                 # to avoid a race we use changegroupsubset() (issue1320)
                 allheads = repo.heads()
                 return changegroupsubset(repo, basenodes, allheads, source)
             def _addchangegroupfiles(repo, source, revmap, trp, pr, needfiles, wasempty):
                 """Add the file groups read from ``source`` to the repo's filelogs.

                 Filelog headers are read until an empty one is returned.  For each
                 named file, ``pr`` is called once and the group is added with
                 addgroup() using ``revmap`` and ``trp``.  When the file is listed
                 in ``needfiles``, every newly added node must be expected and is
                 removed from the expectation; afterwards, any node still expected
                 must already exist in its filelog.  ``wasempty`` is not read here.

                 Returns a (revisions, files) tuple: the number of file revisions
                 added and the number of file groups processed.

                 Raises error.Abort on an empty group, a censored delta base, a
                 spurious entry, or missing file data.
                 """
                 revisions = 0
                 files = 0
                 while True:
                     header = source.filelogheader()
                     if not header:
                         break
                     fname = header["filename"]
                     repo.ui.debug("adding %s revisions\n" % fname)
                     pr()
                     flog = repo.file(fname)
                     before = len(flog)
                     try:
                         added = flog.addgroup(source, revmap, trp)
                         if not added:
                             raise error.Abort(_("received file revlog group is empty"))
                     except error.CensoredBaseError as e:
                         raise error.Abort(_("received delta base is censored: %s") % e)
                     after = len(flog)
                     revisions += after - before
                     files += 1
                     if fname not in needfiles:
                         continue
                     # every new revision of a needed file must be one we expect
                     expected = needfiles[fname]
                     for rev in xrange(before, after):
                         fnode = flog.node(rev)
                         if fnode not in expected:
                             raise error.Abort(
                                 _("received spurious file revlog entry"))
                         expected.remove(fnode)
                     if not expected:
                         del needfiles[fname]

                 repo.ui.progress(_('files'), None)

                 # whatever is still expected must already be present locally
                 for fname, expected in needfiles.iteritems():
                     flog = repo.file(fname)
                     for fnode in expected:
                         try:
                             flog.rev(fnode)
                         except error.LookupError:
                             raise error.Abort(
                                 _('missing file data for %s:%s - run hg verify') %
                                 (fname, hex(fnode)))

                 return revisions, files