changegroup: avoid iterating the whole manifest...
Augie Fackler
r27237:c08814b4 default
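The change in a nutshell: when building a changegroup without the linkrev fastpath, the manifest callback used to iterate every entry of each manifest and test it against one global set of changed files. The changelog callback now records, per manifest node, which files its changesets touched (mfchangedfiles), so the manifest callback only looks up those names. A minimal sketch of the before/after loop, using the names from the diff below (record() is a hypothetical stand-in for the linknode bookkeeping):

    # Before: walk the whole manifest, filtering by the global set.
    for f, n in mdata.iteritems():
        if f in changedfiles:
            record(f, n)

    # After: walk only the files the linked changesets touched.
    for f in mfchangedfiles[x]:
        try:
            n = mdata[f]   # the file may be absent from this manifest
        except KeyError:
            continue
        record(f, n)

For a large manifest touched by few file changes, this is a handful of dict lookups instead of a full iteration.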
@@ -1,961 +1,972 @@
# changegroup.py - Mercurial changegroup manipulation functions
#
# Copyright 2006 Matt Mackall <mpm@selenic.com>
#
# This software may be used and distributed according to the terms of the
# GNU General Public License version 2 or any later version.

from __future__ import absolute_import

import os
import struct
import tempfile
import weakref

from .i18n import _
from .node import (
    hex,
    nullid,
    nullrev,
    short,
)

from . import (
    branchmap,
    dagutil,
    discovery,
    error,
    mdiff,
    phases,
    util,
)

_CHANGEGROUPV1_DELTA_HEADER = "20s20s20s20s"
_CHANGEGROUPV2_DELTA_HEADER = "20s20s20s20s20s"
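# Each delta in the stream is preceded by a fixed-size header of 20-byte
# nodes, matching the struct formats above: for cg1 the revision node, its
# two parents, and the changeset (linkrev) node; cg2 adds a fifth node
# identifying the delta base explicitly (see the _deltaheader methods below).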

def readexactly(stream, n):
    '''read n bytes from stream.read and abort if less was available'''
    s = stream.read(n)
    if len(s) < n:
        raise error.Abort(_("stream ended unexpectedly"
                            " (got %d bytes, expected %d)")
                          % (len(s), n))
    return s

def getchunk(stream):
    """return the next chunk from stream as a string"""
    d = readexactly(stream, 4)
    l = struct.unpack(">l", d)[0]
    if l <= 4:
        if l:
            raise error.Abort(_("invalid chunk length %d") % l)
        return ""
    return readexactly(stream, l - 4)

def chunkheader(length):
    """return a changegroup chunk header (string)"""
    return struct.pack(">l", length + 4)

def closechunk():
    """return a changegroup chunk header (string) for a zero-length chunk"""
    return struct.pack(">l", 0)
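# Framing note: every chunk on the wire is a 4-byte big-endian length
# followed by the payload, and the length includes the 4 header bytes
# themselves. That is why getchunk() treats any value <= 4 as a terminator
# and why closechunk()'s bare zero ends a chunk group.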

def combineresults(results):
    """logic to combine 0 or more addchangegroup results into one"""
    changedheads = 0
    result = 1
    for ret in results:
        # If any changegroup result is 0, return 0
        if ret == 0:
            result = 0
            break
        if ret < -1:
            changedheads += ret + 1
        elif ret > 1:
            changedheads += ret - 1
    if changedheads > 0:
        result = 1 + changedheads
    elif changedheads < 0:
        result = -1 + changedheads
    return result
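# For example, combineresults([3, -2]) is 2: the 3 contributes two added
# heads, the -2 one removed head, leaving one net added head (1 + 1).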

bundletypes = {
    "": ("", None),     # only when using unbundle on ssh and old http servers
                        # since the unification, ssh accepts a header but there
                        # is no capability signaling it.
    "HG20": (), # special-cased below
    "HG10UN": ("HG10UN", None),
    "HG10BZ": ("HG10", 'BZ'),
    "HG10GZ": ("HG10GZ", 'GZ'),
}

# hgweb uses this list to communicate its preferred type
bundlepriority = ['HG10GZ', 'HG10BZ', 'HG10UN']

def writechunks(ui, chunks, filename, vfs=None):
    """Write chunks to a file and return its filename.

    The stream is assumed to be a bundle file.
    Existing files will not be overwritten.
    If no filename is specified, a temporary file is created.
    """
    fh = None
    cleanup = None
    try:
        if filename:
            if vfs:
                fh = vfs.open(filename, "wb")
            else:
                fh = open(filename, "wb")
        else:
            fd, filename = tempfile.mkstemp(prefix="hg-bundle-", suffix=".hg")
            fh = os.fdopen(fd, "wb")
        cleanup = filename
        for c in chunks:
            fh.write(c)
        cleanup = None
        return filename
    finally:
        if fh is not None:
            fh.close()
        if cleanup is not None:
            if filename and vfs:
                vfs.unlink(cleanup)
            else:
                os.unlink(cleanup)

def writebundle(ui, cg, filename, bundletype, vfs=None, compression=None):
    """Write a bundle file and return its filename.

    Existing files will not be overwritten.
    If no filename is specified, a temporary file is created.
    bz2 compression can be turned off.
    The bundle file will be deleted in case of errors.
    """

    if bundletype == "HG20":
        from . import bundle2
        bundle = bundle2.bundle20(ui)
        bundle.setcompression(compression)
        part = bundle.newpart('changegroup', data=cg.getchunks())
        part.addparam('version', cg.version)
        chunkiter = bundle.getchunks()
    else:
        # compression argument is only for the bundle2 case
        assert compression is None
        if cg.version != '01':
            raise error.Abort(_('old bundle types only support v1 '
                                'changegroups'))
        header, comp = bundletypes[bundletype]
        if comp not in util.compressors:
            raise error.Abort(_('unknown stream compression type: %s')
                              % comp)
        z = util.compressors[comp]()
        subchunkiter = cg.getchunks()
        def chunkiter():
            yield header
            for chunk in subchunkiter:
                yield z.compress(chunk)
            yield z.flush()
        chunkiter = chunkiter()

    # parse the changegroup data, otherwise we will block
    # in case of sshrepo because we don't know the end of the stream

    # an empty chunkgroup is the end of the changegroup
    # a changegroup has at least 2 chunkgroups (changelog and manifest).
    # after that, an empty chunkgroup is the end of the changegroup
    return writechunks(ui, chunkiter, filename, vfs=vfs)

class cg1unpacker(object):
    """Unpacker for cg1 changegroup streams.

    A changegroup unpacker handles the framing of the revision data in
    the wire format. Most consumers will want to use the apply()
    method to add the changes from the changegroup to a repository.

    If you're forwarding a changegroup unmodified to another consumer,
    use getchunks(), which returns an iterator of changegroup
    chunks. This is mostly useful for cases where you need to know the
    data stream has ended by observing the end of the changegroup.

    deltachunk() is useful only if you're applying delta data. Most
    consumers should prefer apply() instead.

    A few other public methods exist. Those are used only for
    bundlerepo and some debug commands - their use is discouraged.
    """
    deltaheader = _CHANGEGROUPV1_DELTA_HEADER
    deltaheadersize = struct.calcsize(deltaheader)
    version = '01'
    def __init__(self, fh, alg):
        if alg == 'UN':
            alg = None # get more modern without breaking too much
        if alg not in util.decompressors:
            raise error.Abort(_('unknown stream compression type: %s')
                              % alg)
        if alg == 'BZ':
            alg = '_truncatedBZ'
        self._stream = util.decompressors[alg](fh)
        self._type = alg
        self.callback = None

    # These methods (compressed, read, seek, tell) all appear to only
    # be used by bundlerepo, but it's a little hard to tell.
    def compressed(self):
        return self._type is not None
    def read(self, l):
        return self._stream.read(l)
    def seek(self, pos):
        return self._stream.seek(pos)
    def tell(self):
        return self._stream.tell()
    def close(self):
        return self._stream.close()

    def _chunklength(self):
        d = readexactly(self._stream, 4)
        l = struct.unpack(">l", d)[0]
        if l <= 4:
            if l:
                raise error.Abort(_("invalid chunk length %d") % l)
            return 0
        if self.callback:
            self.callback()
        return l - 4

    def changelogheader(self):
        """v10 does not have a changelog header chunk"""
        return {}

    def manifestheader(self):
        """v10 does not have a manifest header chunk"""
        return {}

    def filelogheader(self):
        """return the header of the filelogs chunk, v10 only has the filename"""
        l = self._chunklength()
        if not l:
            return {}
        fname = readexactly(self._stream, l)
        return {'filename': fname}

    def _deltaheader(self, headertuple, prevnode):
        node, p1, p2, cs = headertuple
        if prevnode is None:
            deltabase = p1
        else:
            deltabase = prevnode
        return node, p1, p2, deltabase, cs

    def deltachunk(self, prevnode):
        l = self._chunklength()
        if not l:
            return {}
        headerdata = readexactly(self._stream, self.deltaheadersize)
        header = struct.unpack(self.deltaheader, headerdata)
        delta = readexactly(self._stream, l - self.deltaheadersize)
        node, p1, p2, deltabase, cs = self._deltaheader(header, prevnode)
        return {'node': node, 'p1': p1, 'p2': p2, 'cs': cs,
                'deltabase': deltabase, 'delta': delta}

    def getchunks(self):
        """returns all the chunks contained in the bundle

        Used when you need to forward the binary stream to a file or another
        network API. To do so, it parses the changegroup data; otherwise it
        would block in the sshrepo case, because it doesn't know where the
        stream ends.
        """
        # an empty chunkgroup is the end of the changegroup
        # a changegroup has at least 2 chunkgroups (changelog and manifest).
        # after that, an empty chunkgroup is the end of the changegroup
        empty = False
        count = 0
        while not empty or count <= 2:
            empty = True
            count += 1
            while True:
                chunk = getchunk(self)
                if not chunk:
                    break
                empty = False
                yield chunkheader(len(chunk))
                pos = 0
                while pos < len(chunk):
                    next = pos + 2**20
                    yield chunk[pos:next]
                    pos = next
            yield closechunk()

    def _unpackmanifests(self, repo, revmap, trp, prog, numchanges):
        # We know that we'll never have more manifests than we had
        # changesets.
        self.callback = prog(_('manifests'), numchanges)
        # no need to check for empty manifest group here:
        # if the result of the merge of 1 and 2 is the same in 3 and 4,
        # no new manifest will be created and the manifest group will
        # be empty during the pull
        self.manifestheader()
        repo.manifest.addgroup(self, revmap, trp)
        repo.ui.progress(_('manifests'), None)

    def apply(self, repo, srctype, url, emptyok=False,
              targetphase=phases.draft, expectedtotal=None):
        """Add the changegroup returned by source.read() to this repo.
        srctype is a string like 'push', 'pull', or 'unbundle'. url is
        the URL of the repo where this changegroup is coming from.

        Return an integer summarizing the change to this repo:
        - nothing changed or no source: 0
        - more heads than before: 1+added heads (2..n)
        - fewer heads than before: -1-removed heads (-2..-n)
        - number of heads stays the same: 1
        """
        repo = repo.unfiltered()
        wasempty = (len(repo.changelog) == 0)
        def csmap(x):
            repo.ui.debug("add changeset %s\n" % short(x))
            return len(cl)

        def revmap(x):
            return cl.rev(x)

        changesets = files = revisions = 0

        tr = repo.transaction("\n".join([srctype, util.hidepassword(url)]))
        try:
            # The transaction could have been created before and already
            # carries source information. In this case we use the top
            # level data. We overwrite the argument because we need to use
            # the top level values (if they exist) in this function.
            srctype = tr.hookargs.setdefault('source', srctype)
            url = tr.hookargs.setdefault('url', url)
            repo.hook('prechangegroup', throw=True, **tr.hookargs)

            # write changelog data to temp files so concurrent readers
            # will not see an inconsistent view
            cl = repo.changelog
            cl.delayupdate(tr)
            oldheads = cl.heads()

            trp = weakref.proxy(tr)
            # pull off the changeset group
            repo.ui.status(_("adding changesets\n"))
            clstart = len(cl)
            class prog(object):
                def __init__(self, step, total):
                    self._step = step
                    self._total = total
                    self._count = 1
                def __call__(self):
                    repo.ui.progress(self._step, self._count, unit=_('chunks'),
                                     total=self._total)
                    self._count += 1
            self.callback = prog(_('changesets'), expectedtotal)

            efiles = set()
            def onchangelog(cl, node):
                efiles.update(cl.read(node)[3])

            self.changelogheader()
            srccontent = cl.addgroup(self, csmap, trp,
                                     addrevisioncb=onchangelog)
            efiles = len(efiles)

            if not (srccontent or emptyok):
                raise error.Abort(_("received changelog group is empty"))
            clend = len(cl)
            changesets = clend - clstart
            repo.ui.progress(_('changesets'), None)

            # pull off the manifest group
            repo.ui.status(_("adding manifests\n"))
            self._unpackmanifests(repo, revmap, trp, prog, changesets)

            needfiles = {}
            if repo.ui.configbool('server', 'validate', default=False):
                # validate incoming csets have their manifests
                for cset in xrange(clstart, clend):
                    mfnode = repo.changelog.read(repo.changelog.node(cset))[0]
                    mfest = repo.manifest.readdelta(mfnode)
                    # store file nodes we must see
                    for f, n in mfest.iteritems():
                        needfiles.setdefault(f, set()).add(n)

            # process the files
            repo.ui.status(_("adding file changes\n"))
            self.callback = None
            pr = prog(_('files'), efiles)
            newrevs, newfiles = _addchangegroupfiles(
                repo, self, revmap, trp, pr, needfiles, wasempty)
            revisions += newrevs
            files += newfiles

            dh = 0
            if oldheads:
                heads = cl.heads()
                dh = len(heads) - len(oldheads)
                for h in heads:
                    if h not in oldheads and repo[h].closesbranch():
                        dh -= 1
            htext = ""
            if dh:
                htext = _(" (%+d heads)") % dh

            repo.ui.status(_("added %d changesets"
                             " with %d changes to %d files%s\n")
                           % (changesets, revisions, files, htext))
            repo.invalidatevolatilesets()

            if changesets > 0:
                if 'node' not in tr.hookargs:
                    tr.hookargs['node'] = hex(cl.node(clstart))
                    hookargs = dict(tr.hookargs)
                else:
                    hookargs = dict(tr.hookargs)
                    hookargs['node'] = hex(cl.node(clstart))
                repo.hook('pretxnchangegroup', throw=True, **hookargs)

            added = [cl.node(r) for r in xrange(clstart, clend)]
            publishing = repo.publishing()
            if srctype in ('push', 'serve'):
                # Old servers can not push the boundary themselves.
                # New servers won't push the boundary if changeset already
                # exists locally as secret
                #
                # We should not use added here but the list of all changes in
                # the bundle
                if publishing:
                    phases.advanceboundary(repo, tr, phases.public, srccontent)
                else:
                    # Those changesets have been pushed from the outside, their
                    # phases are going to be pushed alongside. Therefore
                    # `targetphase` is ignored.
                    phases.advanceboundary(repo, tr, phases.draft, srccontent)
                    phases.retractboundary(repo, tr, phases.draft, added)
            elif srctype != 'strip':
                # publishing only alters behavior during push
                #
                # strip should not touch boundary at all
                phases.retractboundary(repo, tr, targetphase, added)

            if changesets > 0:
                if srctype != 'strip':
                    # During strip, branchcache is invalid but the coming call
                    # to `destroyed` will repair it.
                    # In other cases we can safely update the cache on disk.
                    branchmap.updatecache(repo.filtered('served'))

                def runhooks():
                    # These hooks run when the lock releases, not when the
                    # transaction closes. So it's possible for the changelog
                    # to have changed since we last saw it.
                    if clstart >= len(repo):
                        return

                    # forcefully update the on-disk branch cache
                    repo.ui.debug("updating the branch cache\n")
                    repo.hook("changegroup", **hookargs)

                    for n in added:
                        args = hookargs.copy()
                        args['node'] = hex(n)
                        repo.hook("incoming", **args)

                    newheads = [h for h in repo.heads() if h not in oldheads]
                    repo.ui.log("incoming",
                                "%s incoming changes - new heads: %s\n",
                                len(added),
                                ', '.join([hex(c[:6]) for c in newheads]))

                tr.addpostclose('changegroup-runhooks-%020i' % clstart,
                                lambda tr: repo._afterlock(runhooks))

            tr.close()

        finally:
            tr.release()
        repo.ui.flush()
        # never return 0 here:
        if dh < 0:
            return dh - 1
        else:
            return dh + 1

class cg2unpacker(cg1unpacker):
    """Unpacker for cg2 streams.

    cg2 streams add support for generaldelta, so the delta header
    format is slightly different. All other features about the data
    remain the same.
    """
    deltaheader = _CHANGEGROUPV2_DELTA_HEADER
    deltaheadersize = struct.calcsize(deltaheader)
    version = '02'

    def _deltaheader(self, headertuple, prevnode):
        node, p1, p2, deltabase, cs = headertuple
        return node, p1, p2, deltabase, cs

class headerlessfixup(object):
    def __init__(self, fh, h):
        self._h = h
        self._fh = fh
    def read(self, n):
        if self._h:
            d, self._h = self._h[:n], self._h[n:]
            if len(d) < n:
                d += readexactly(self._fh, n - len(d))
            return d
        return readexactly(self._fh, n)

class cg1packer(object):
    deltaheader = _CHANGEGROUPV1_DELTA_HEADER
    version = '01'
    def __init__(self, repo, bundlecaps=None):
        """Given a source repo, construct a bundler.

        bundlecaps is optional and can be used to specify the set of
        capabilities which can be used to build the bundle.
        """
        # Set of capabilities we can use to build the bundle.
        if bundlecaps is None:
            bundlecaps = set()
        self._bundlecaps = bundlecaps
        # experimental config: bundle.reorder
        reorder = repo.ui.config('bundle', 'reorder', 'auto')
        if reorder == 'auto':
            reorder = None
        else:
            reorder = util.parsebool(reorder)
        self._repo = repo
        self._reorder = reorder
        self._progress = repo.ui.progress
        if self._repo.ui.verbose and not self._repo.ui.debugflag:
            self._verbosenote = self._repo.ui.note
        else:
            self._verbosenote = lambda s: None

    def close(self):
        return closechunk()

    def fileheader(self, fname):
        return chunkheader(len(fname)) + fname

    def group(self, nodelist, revlog, lookup, units=None):
        """Calculate a delta group, yielding a sequence of changegroup chunks
        (strings).

        Given a list of changeset revs, return a set of deltas and
        metadata corresponding to nodes. The first delta is
        first parent(nodelist[0]) -> nodelist[0]; the receiver is
        guaranteed to have this parent, as it has all history before
        these changesets. In the case the first parent is nullrev,
        the changegroup starts with a full revision.

        If units is not None, progress detail will be generated; units
        specifies the type of revlog that is touched (changelog, manifest,
        etc.).
        """
        # if we don't have any revisions touched by these changesets, bail
        if len(nodelist) == 0:
            yield self.close()
            return

        # for generaldelta revlogs, we linearize the revs; this will both be
        # much quicker and generate a much smaller bundle
        if (revlog._generaldelta and self._reorder is None) or self._reorder:
            dag = dagutil.revlogdag(revlog)
            revs = set(revlog.rev(n) for n in nodelist)
            revs = dag.linearize(revs)
        else:
            revs = sorted([revlog.rev(n) for n in nodelist])

        # add the parent of the first rev
        p = revlog.parentrevs(revs[0])[0]
        revs.insert(0, p)

        # build deltas
        total = len(revs) - 1
        msgbundling = _('bundling')
        for r in xrange(len(revs) - 1):
            if units is not None:
                self._progress(msgbundling, r + 1, unit=units, total=total)
            prev, curr = revs[r], revs[r + 1]
            linknode = lookup(revlog.node(curr))
            for c in self.revchunk(revlog, curr, prev, linknode):
                yield c

        if units is not None:
            self._progress(msgbundling, None)
        yield self.close()

    # filter any nodes that claim to be part of the known set
    def prune(self, revlog, missing, commonrevs):
        rr, rl = revlog.rev, revlog.linkrev
        return [n for n in missing if rl(rr(n)) not in commonrevs]

    def _packmanifests(self, mfnodes, lookuplinknode):
        """Pack flat manifests into a changegroup stream."""
        ml = self._repo.manifest
        size = 0
        for chunk in self.group(
                mfnodes, ml, lookuplinknode, units=_('manifests')):
            size += len(chunk)
            yield chunk
        self._verbosenote(_('%8.i (manifests)\n') % size)

    def generate(self, commonrevs, clnodes, fastpathlinkrev, source):
        '''yield a sequence of changegroup chunks (strings)'''
        repo = self._repo
        cl = repo.changelog
        ml = repo.manifest

        clrevorder = {}
        mfs = {} # needed manifests
        fnodes = {} # needed file nodes
-        changedfiles = set()
+        # maps manifest node id -> set(changed files)
+        mfchangedfiles = {}

        # Callback for the changelog, used to collect changed files and manifest
        # nodes.
        # Returns the linkrev node (identity in the changelog case).
        def lookupcl(x):
            c = cl.read(x)
            clrevorder[x] = len(clrevorder)
-            changedfiles.update(c[3])
+            n = c[0]
            # record the first changeset introducing this manifest version
-            mfs.setdefault(c[0], x)
+            mfs.setdefault(n, x)
+            # Record a complete list of potentially-changed files in
+            # this manifest.
+            mfchangedfiles.setdefault(n, set()).update(c[3])
            return x

        self._verbosenote(_('uncompressed size of bundle content:\n'))
        size = 0
        for chunk in self.group(clnodes, cl, lookupcl, units=_('changesets')):
            size += len(chunk)
            yield chunk
        self._verbosenote(_('%8.i (changelog)\n') % size)

        # We need to make sure that the linkrev in the changegroup refers to
        # the first changeset that introduced the manifest or file revision.
        # The fastpath is usually safer than the slowpath, because the filelogs
        # are walked in revlog order.
        #
        # When taking the slowpath with reorder=None and the manifest revlog
        # uses generaldelta, the manifest may be walked in the "wrong" order.
        # Without 'clrevorder', we would get an incorrect linkrev (see fix in
        # cc0ff93d0c0c).
        #
        # When taking the fastpath, we are only vulnerable to reordering
        # of the changelog itself. The changelog never uses generaldelta, so
        # it is only reordered when reorder=True. To handle this case, we
        # simply take the slowpath, which already has the 'clrevorder' logic.
        # This was also fixed in cc0ff93d0c0c.
        fastpathlinkrev = fastpathlinkrev and not self._reorder
        # Callback for the manifest, used to collect linkrevs for filelog
        # revisions.
        # Returns the linkrev node (collected in lookupcl).
        def lookupmflinknode(x):
            """Callback for looking up the linknode for manifests.

            Returns the linkrev node for the specified manifest.

            SIDE EFFECT:

            fclnodes gets populated with the list of relevant
            file nodes if we're not using fastpathlinkrev.

            Note that this means you can't trust fclnodes until
            after manifests have been sent to the client.
            """
            clnode = mfs[x]
            if not fastpathlinkrev:
                mdata = ml.readfast(x)
-                for f, n in mdata.iteritems():
-                    if f in changedfiles:
+                for f in mfchangedfiles[x]:
+                    if True:
+                        try:
+                            n = mdata[f]
+                        except KeyError:
+                            continue
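                        # (the otherwise-pointless 'if True:' above presumably
                        # just preserves this block's indentation, keeping the
                        # diff against the old membership test minimal)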
                        # record the first changeset introducing this filelog
                        # version
                        fclnodes = fnodes.setdefault(f, {})
                        fclnode = fclnodes.setdefault(n, clnode)
                        if clrevorder[clnode] < clrevorder[fclnode]:
                            fclnodes[n] = clnode
            return clnode

        mfnodes = self.prune(ml, mfs, commonrevs)
        for x in self._packmanifests(mfnodes, lookupmflinknode):
            yield x

        mfs.clear()
        clrevs = set(cl.rev(x) for x in clnodes)

        def linknodes(filerevlog, fname):
            if fastpathlinkrev:
                llr = filerevlog.linkrev
                def genfilenodes():
                    for r in filerevlog:
                        linkrev = llr(r)
                        if linkrev in clrevs:
                            yield filerevlog.node(r), cl.node(linkrev)
                return dict(genfilenodes())
            return fnodes.get(fname, {})

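        # The aggregate set of changed files is only needed from here on, for
        # the filelog pass, so it is rebuilt from the per-manifest map now.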
+        changedfiles = set()
+        for x in mfchangedfiles.itervalues():
+            changedfiles.update(x)
        for chunk in self.generatefiles(changedfiles, linknodes, commonrevs,
                                        source):
            yield chunk

        yield self.close()

        if clnodes:
            repo.hook('outgoing', node=hex(clnodes[0]), source=source)

    # The 'source' parameter is useful for extensions
    def generatefiles(self, changedfiles, linknodes, commonrevs, source):
        repo = self._repo
        progress = self._progress
        msgbundling = _('bundling')

        total = len(changedfiles)
        # for progress output
        msgfiles = _('files')
        for i, fname in enumerate(sorted(changedfiles)):
            filerevlog = repo.file(fname)
            if not filerevlog:
                raise error.Abort(_("empty or missing revlog for %s") % fname)

            linkrevnodes = linknodes(filerevlog, fname)
            # Lookup for filenodes; we collected the linkrev nodes above in the
            # fastpath case and with lookupmflinknode in the slowpath case.
            def lookupfilelog(x):
                return linkrevnodes[x]

            filenodes = self.prune(filerevlog, linkrevnodes, commonrevs)
            if filenodes:
                progress(msgbundling, i + 1, item=fname, unit=msgfiles,
                         total=total)
                h = self.fileheader(fname)
                size = len(h)
                yield h
                for chunk in self.group(filenodes, filerevlog, lookupfilelog):
                    size += len(chunk)
                    yield chunk
                self._verbosenote(_('%8.i %s\n') % (size, fname))
        progress(msgbundling, None)

    def deltaparent(self, revlog, rev, p1, p2, prev):
        return prev

    def revchunk(self, revlog, rev, prev, linknode):
        node = revlog.node(rev)
        p1, p2 = revlog.parentrevs(rev)
        base = self.deltaparent(revlog, rev, p1, p2, prev)

        prefix = ''
        if revlog.iscensored(base) or revlog.iscensored(rev):
            try:
                delta = revlog.revision(node)
            except error.CensoredNodeError as e:
                delta = e.tombstone
            if base == nullrev:
                prefix = mdiff.trivialdiffheader(len(delta))
            else:
                baselen = revlog.rawsize(base)
                prefix = mdiff.replacediffheader(baselen, len(delta))
        elif base == nullrev:
            delta = revlog.revision(node)
            prefix = mdiff.trivialdiffheader(len(delta))
        else:
            delta = revlog.revdiff(base, rev)
        p1n, p2n = revlog.parents(node)
        basenode = revlog.node(base)
        meta = self.builddeltaheader(node, p1n, p2n, basenode, linknode)
        meta += prefix
        l = len(meta) + len(delta)
        yield chunkheader(l)
        yield meta
        yield delta
    def builddeltaheader(self, node, p1n, p2n, basenode, linknode):
        # do nothing with basenode, it is implicitly the previous one in HG10
        return struct.pack(self.deltaheader, node, p1n, p2n, linknode)

class cg2packer(cg1packer):
    version = '02'
    deltaheader = _CHANGEGROUPV2_DELTA_HEADER

    def __init__(self, repo, bundlecaps=None):
        super(cg2packer, self).__init__(repo, bundlecaps)
        if self._reorder is None:
            # Since generaldelta is directly supported by cg2, reordering
            # generally doesn't help, so we disable it by default (treating
            # bundle.reorder=auto just like bundle.reorder=False).
            self._reorder = False

    def deltaparent(self, revlog, rev, p1, p2, prev):
        dp = revlog.deltaparent(rev)
        # avoid storing full revisions; pick prev in those cases
        # also pick prev when we can't be sure remote has dp
        if dp == nullrev or (dp != p1 and dp != p2 and dp != prev):
            return prev
        return dp

    def builddeltaheader(self, node, p1n, p2n, basenode, linknode):
        return struct.pack(self.deltaheader, node, p1n, p2n, basenode, linknode)

packermap = {'01': (cg1packer, cg1unpacker),
             # cg2 adds support for exchanging generaldelta
             '02': (cg2packer, cg2unpacker),
}
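# Example: packermap['02'][0](repo) builds a cg2packer for generating a
# version-02 stream, while packermap['02'][1] is the matching unpacker,
# which getsubset below instantiates over the generated chunk stream.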
804
815
805 def _changegroupinfo(repo, nodes, source):
816 def _changegroupinfo(repo, nodes, source):
806 if repo.ui.verbose or source == 'bundle':
817 if repo.ui.verbose or source == 'bundle':
807 repo.ui.status(_("%d changesets found\n") % len(nodes))
818 repo.ui.status(_("%d changesets found\n") % len(nodes))
808 if repo.ui.debugflag:
819 if repo.ui.debugflag:
809 repo.ui.debug("list of changesets:\n")
820 repo.ui.debug("list of changesets:\n")
810 for node in nodes:
821 for node in nodes:
811 repo.ui.debug("%s\n" % hex(node))
822 repo.ui.debug("%s\n" % hex(node))
812
823
813 def getsubsetraw(repo, outgoing, bundler, source, fastpath=False):
824 def getsubsetraw(repo, outgoing, bundler, source, fastpath=False):
814 repo = repo.unfiltered()
825 repo = repo.unfiltered()
815 commonrevs = outgoing.common
826 commonrevs = outgoing.common
816 csets = outgoing.missing
827 csets = outgoing.missing
817 heads = outgoing.missingheads
828 heads = outgoing.missingheads
818 # We go through the fast path if we get told to, or if all (unfiltered
829 # We go through the fast path if we get told to, or if all (unfiltered
819 # heads have been requested (since we then know there all linkrevs will
830 # heads have been requested (since we then know there all linkrevs will
820 # be pulled by the client).
831 # be pulled by the client).
821 heads.sort()
832 heads.sort()
822 fastpathlinkrev = fastpath or (
833 fastpathlinkrev = fastpath or (
823 repo.filtername is None and heads == sorted(repo.heads()))
834 repo.filtername is None and heads == sorted(repo.heads()))
824
835
825 repo.hook('preoutgoing', throw=True, source=source)
836 repo.hook('preoutgoing', throw=True, source=source)
826 _changegroupinfo(repo, csets, source)
837 _changegroupinfo(repo, csets, source)
827 return bundler.generate(commonrevs, csets, fastpathlinkrev, source)
838 return bundler.generate(commonrevs, csets, fastpathlinkrev, source)
828
839
829 def getsubset(repo, outgoing, bundler, source, fastpath=False):
840 def getsubset(repo, outgoing, bundler, source, fastpath=False):
830 gengroup = getsubsetraw(repo, outgoing, bundler, source, fastpath)
841 gengroup = getsubsetraw(repo, outgoing, bundler, source, fastpath)
831 return packermap[bundler.version][1](util.chunkbuffer(gengroup), None)
842 return packermap[bundler.version][1](util.chunkbuffer(gengroup), None)
832
843
833 def changegroupsubset(repo, roots, heads, source, version='01'):
844 def changegroupsubset(repo, roots, heads, source, version='01'):
834 """Compute a changegroup consisting of all the nodes that are
845 """Compute a changegroup consisting of all the nodes that are
835 descendants of any of the roots and ancestors of any of the heads.
846 descendants of any of the roots and ancestors of any of the heads.
836 Return a chunkbuffer object whose read() method will return
847 Return a chunkbuffer object whose read() method will return
837 successive changegroup chunks.
848 successive changegroup chunks.
838
849
839 It is fairly complex as determining which filenodes and which
850 It is fairly complex as determining which filenodes and which
840 manifest nodes need to be included for the changeset to be complete
851 manifest nodes need to be included for the changeset to be complete
841 is non-trivial.
852 is non-trivial.
842
853
843 Another wrinkle is doing the reverse, figuring out which changeset in
854 Another wrinkle is doing the reverse, figuring out which changeset in
844 the changegroup a particular filenode or manifestnode belongs to.
855 the changegroup a particular filenode or manifestnode belongs to.
845 """
856 """
    cl = repo.changelog
    if not roots:
        roots = [nullid]
    discbases = []
    for n in roots:
        discbases.extend([p for p in cl.parents(n) if p != nullid])
    # TODO: remove call to nodesbetween.
    csets, roots, heads = cl.nodesbetween(roots, heads)
    included = set(csets)
    discbases = [n for n in discbases if n not in included]
    outgoing = discovery.outgoing(cl, discbases, heads)
    bundler = packermap[version][0](repo)
    return getsubset(repo, outgoing, bundler, source)

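# Hypothetical usage sketch (rootnode stands in for a real changeset node):
#
#   cg = changegroupsubset(repo, [rootnode], repo.heads(), 'pull',
#                          version='02')
#   data = cg.read(4096)   # successive changegroup chunks
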
def getlocalchangegroupraw(repo, source, outgoing, bundlecaps=None,
                           version='01'):
    """Like getbundle, but taking a discovery.outgoing as an argument.

    This is only implemented for local repos and reuses potentially
    precomputed sets in outgoing. Returns a raw changegroup generator."""
    if not outgoing.missing:
        return None
    bundler = packermap[version][0](repo, bundlecaps)
    return getsubsetraw(repo, outgoing, bundler, source)

def getlocalchangegroup(repo, source, outgoing, bundlecaps=None,
                        version='01'):
    """Like getbundle, but taking a discovery.outgoing as an argument.

    This is only implemented for local repos and reuses potentially
    precomputed sets in outgoing."""
    if not outgoing.missing:
        return None
    bundler = packermap[version][0](repo, bundlecaps)
    return getsubset(repo, outgoing, bundler, source)

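# Both local helpers return None when outgoing.missing is empty; otherwise
# the 'raw' variant yields bare chunks while this one returns an unpacker.
# A sketch, assuming a precomputed outgoing set:
#
#   raw = getlocalchangegroupraw(repo, 'push', outgoing)  # generator or None
#   cg = getlocalchangegroup(repo, 'push', outgoing)      # unpacker or None
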
def computeoutgoing(repo, heads, common):
    """Computes which revs are outgoing given a set of common
    and a set of heads.

    This is a separate function so extensions can have access to
    the logic.

    Returns a discovery.outgoing object.
    """
    cl = repo.changelog
    if common:
        hasnode = cl.hasnode
        common = [n for n in common if hasnode(n)]
    else:
        common = [nullid]
    if not heads:
        heads = cl.heads()
    return discovery.outgoing(cl, common, heads)

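# Defaulting behaviour, illustrated with a hypothetical call: common nodes
# unknown to the local changelog are dropped, and absent arguments fall back
# to [nullid] and the local heads:
#
#   out = computeoutgoing(repo, heads=None, common=None)
#   # behaves like discovery.outgoing(repo.changelog, [nullid],
#   #                                 repo.changelog.heads())
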
def getchangegroup(repo, source, heads=None, common=None, bundlecaps=None,
                   version='01'):
    """Like changegroupsubset, but returns the set difference between the
    ancestors of heads and the ancestors of common.

    If heads is None, use the local heads. If common is None, use [nullid].

    The nodes in common might not all be known locally due to the way the
    current discovery protocol works.
    """
    outgoing = computeoutgoing(repo, heads, common)
    return getlocalchangegroup(repo, source, outgoing, bundlecaps=bundlecaps,
                               version=version)

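# Minimal sketch (commonnodes is a hypothetical list of nodes shared with
# the remote):
#
#   cg = getchangegroup(repo, 'serve', heads=repo.heads(),
#                       common=commonnodes, version='02')
#   # cg is an unpacker, or None when nothing is missing
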
def changegroup(repo, basenodes, source):
    # to avoid a race we use changegroupsubset() (issue1320)
    return changegroupsubset(repo, basenodes, repo.heads(), source)

def _addchangegroupfiles(repo, source, revmap, trp, pr, needfiles, wasempty):
    revisions = 0
    files = 0
    while True:
        chunkdata = source.filelogheader()
        if not chunkdata:
            break
        f = chunkdata["filename"]
        repo.ui.debug("adding %s revisions\n" % f)
        pr()
        fl = repo.file(f)
        o = len(fl)
        try:
            if not fl.addgroup(source, revmap, trp):
                raise error.Abort(_("received file revlog group is empty"))
        except error.CensoredBaseError as e:
            raise error.Abort(_("received delta base is censored: %s") % e)
        revisions += len(fl) - o
        files += 1
        if f in needfiles:
            needs = needfiles[f]
            for new in xrange(o, len(fl)):
                n = fl.node(new)
                if n in needs:
                    needs.remove(n)
                else:
                    raise error.Abort(
                        _("received spurious file revlog entry"))
            if not needs:
                del needfiles[f]
    repo.ui.progress(_('files'), None)

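    # Assumed invariant (descriptive note): needfiles maps each filename to
    # the set of filenode hashes the incoming changesets still require; any
    # entry surviving the loop above means required file data never arrived.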
    for f, needs in needfiles.iteritems():
        fl = repo.file(f)
        for n in needs:
            try:
                fl.rev(n)
            except error.LookupError:
                raise error.Abort(
                    _('missing file data for %s:%s - run hg verify') %
                    (f, hex(n)))

    return revisions, files