upstream/mercurial-mirror Commit - r27238:c3dc0310

1

# changegroup.py - Mercurial changegroup manipulation functions

1

# changegroup.py - Mercurial changegroup manipulation functions

2

#

2

#

3

4

#

4

#

5

# This software may be used and distributed according to the terms of the

5

# This software may be used and distributed according to the terms of the

6

# GNU General Public License version 2 or any later version.

6

# GNU General Public License version 2 or any later version.

7

8

from __future__ import absolute_import

8

from __future__ import absolute_import

9

10

import os

10

import os

11

import struct

11

import struct

12

import tempfile

12

import tempfile

13

import weakref

13

import weakref

14

15

from .i18n import _

15

from .i18n import _

16

from .node import (

16

from .node import (

17

hex,

17

hex,

18

nullid,

18

nullid,

19

nullrev,

19

nullrev,

20

short,

20

short,

21

)

21

)

22

23

from . import (

23

from . import (

24

branchmap,

24

branchmap,

25

dagutil,

25

dagutil,

26

discovery,

26

discovery,

27

error,

27

error,

28

mdiff,

28

mdiff,

29

phases,

29

phases,

30

util,

30

util,

31

)

31

)

32

33

_CHANGEGROUPV1_DELTA_HEADER = "20s20s20s20s"

33

_CHANGEGROUPV1_DELTA_HEADER = "20s20s20s20s"

34

_CHANGEGROUPV2_DELTA_HEADER = "20s20s20s20s20s"

34

_CHANGEGROUPV2_DELTA_HEADER = "20s20s20s20s20s"

35

36

def readexactly(stream, n):

36

def readexactly(stream, n):

37

'''read n bytes from stream.read and abort if less was available'''

37

'''read n bytes from stream.read and abort if less was available'''

38

s = stream.read(n)

38

s = stream.read(n)

39

if len(s) < n:

39

if len(s) < n:

40

raise error.Abort(_("stream ended unexpectedly"

40

raise error.Abort(_("stream ended unexpectedly"

41

" (got %d bytes, expected %d)")

41

" (got %d bytes, expected %d)")

42

% (len(s), n))

42

% (len(s), n))

43

return s

43

return s

44

45

def getchunk(stream):

45

def getchunk(stream):

46

"""return the next chunk from stream as a string"""

46

"""return the next chunk from stream as a string"""

47

d = readexactly(stream, 4)

47

d = readexactly(stream, 4)

48

l = struct.unpack(">l", d)[0]

48

l = struct.unpack(">l", d)[0]

49

if l <= 4:

49

if l <= 4:

50

if l:

50

if l:

51

raise error.Abort(_("invalid chunk length %d") % l)

51

raise error.Abort(_("invalid chunk length %d") % l)

52

return ""

52

return ""

53

return readexactly(stream, l - 4)

53

return readexactly(stream, l - 4)

54

55

def chunkheader(length):

55

def chunkheader(length):

56

"""return a changegroup chunk header (string)"""

56

"""return a changegroup chunk header (string)"""

57

return struct.pack(">l", length + 4)

57

return struct.pack(">l", length + 4)

58

59

def closechunk():

59

def closechunk():

60

"""return a changegroup chunk header (string) for a zero-length chunk"""

60

"""return a changegroup chunk header (string) for a zero-length chunk"""

61

return struct.pack(">l", 0)

61

return struct.pack(">l", 0)

62

63

def combineresults(results):

63

def combineresults(results):

64

"""logic to combine 0 or more addchangegroup results into one"""

64

"""logic to combine 0 or more addchangegroup results into one"""

65

changedheads = 0

65

changedheads = 0

66

result = 1

66

result = 1

67

for ret in results:

67

for ret in results:

68

# If any changegroup result is 0, return 0

68

# If any changegroup result is 0, return 0

69

if ret == 0:

69

if ret == 0:

70

result = 0

70

result = 0

71

break

71

break

72

if ret < -1:

72

if ret < -1:

73

changedheads += ret + 1

73

changedheads += ret + 1

74

elif ret > 1:

74

elif ret > 1:

75

changedheads += ret - 1

75

changedheads += ret - 1

76

if changedheads > 0:

76

if changedheads > 0:

77

result = 1 + changedheads

77

result = 1 + changedheads

78

elif changedheads < 0:

78

elif changedheads < 0:

79

result = -1 + changedheads

79

result = -1 + changedheads

80

return result

80

return result

81

82

bundletypes = {

82

bundletypes = {

83

"": ("", None), # only when using unbundle on ssh and old http servers

83

"": ("", None), # only when using unbundle on ssh and old http servers

84

# since the unification ssh accepts a header but there

84

# since the unification ssh accepts a header but there

85

# is no capability signaling it.

85

# is no capability signaling it.

86

"HG20": (), # special-cased below

86

"HG20": (), # special-cased below

87

"HG10UN": ("HG10UN", None),

87

"HG10UN": ("HG10UN", None),

88

"HG10BZ": ("HG10", 'BZ'),

88

"HG10BZ": ("HG10", 'BZ'),

89

"HG10GZ": ("HG10GZ", 'GZ'),

89

"HG10GZ": ("HG10GZ", 'GZ'),

90

}

90

}

91

92

# hgweb uses this list to communicate its preferred type

92

# hgweb uses this list to communicate its preferred type

93

bundlepriority = ['HG10GZ', 'HG10BZ', 'HG10UN']

93

bundlepriority = ['HG10GZ', 'HG10BZ', 'HG10UN']

94

95

def writechunks(ui, chunks, filename, vfs=None):

95

def writechunks(ui, chunks, filename, vfs=None):

96

"""Write chunks to a file and return its filename.

96

"""Write chunks to a file and return its filename.

97

98

The stream is assumed to be a bundle file.

98

The stream is assumed to be a bundle file.

99

Existing files will not be overwritten.

99

Existing files will not be overwritten.

100

If no filename is specified, a temporary file is created.

100

If no filename is specified, a temporary file is created.

101

"""

101

"""

102

fh = None

102

fh = None

103

cleanup = None

103

cleanup = None

104

try:

104

try:

105

if filename:

105

if filename:

106

if vfs:

106

if vfs:

107

fh = vfs.open(filename, "wb")

107

fh = vfs.open(filename, "wb")

108

else:

108

else:

109

fh = open(filename, "wb")

109

fh = open(filename, "wb")

110

else:

110

else:

111

fd, filename = tempfile.mkstemp(prefix="hg-bundle-", suffix=".hg")

111

fd, filename = tempfile.mkstemp(prefix="hg-bundle-", suffix=".hg")

112

fh = os.fdopen(fd, "wb")

112

fh = os.fdopen(fd, "wb")

113

cleanup = filename

113

cleanup = filename

114

for c in chunks:

114

for c in chunks:

115

fh.write(c)

115

fh.write(c)

116

cleanup = None

116

cleanup = None

117

return filename

117

return filename

118

finally:

118

finally:

119

if fh is not None:

119

if fh is not None:

120

fh.close()

120

fh.close()

121

if cleanup is not None:

121

if cleanup is not None:

122

if filename and vfs:

122

if filename and vfs:

123

vfs.unlink(cleanup)

123

vfs.unlink(cleanup)

124

else:

124

else:

125

os.unlink(cleanup)

125

os.unlink(cleanup)

126

127

def writebundle(ui, cg, filename, bundletype, vfs=None, compression=None):

127

def writebundle(ui, cg, filename, bundletype, vfs=None, compression=None):

128

"""Write a bundle file and return its filename.

128

"""Write a bundle file and return its filename.

129

130

Existing files will not be overwritten.

130

Existing files will not be overwritten.

131

If no filename is specified, a temporary file is created.

131

If no filename is specified, a temporary file is created.

132

bz2 compression can be turned off.

132

bz2 compression can be turned off.

133

The bundle file will be deleted in case of errors.

133

The bundle file will be deleted in case of errors.

134

"""

134

"""

135

136

if bundletype == "HG20":

136

if bundletype == "HG20":

137

from . import bundle2

137

from . import bundle2

138

bundle = bundle2.bundle20(ui)

138

bundle = bundle2.bundle20(ui)

139

bundle.setcompression(compression)

139

bundle.setcompression(compression)

140

part = bundle.newpart('changegroup', data=cg.getchunks())

140

part = bundle.newpart('changegroup', data=cg.getchunks())

141

part.addparam('version', cg.version)

141

part.addparam('version', cg.version)

142

chunkiter = bundle.getchunks()

142

chunkiter = bundle.getchunks()

143

else:

143

else:

144

# compression argument is only for the bundle2 case

144

# compression argument is only for the bundle2 case

145

assert compression is None

145

assert compression is None

146

if cg.version != '01':

146

if cg.version != '01':

147

raise error.Abort(_('old bundle types only supports v1 '

147

raise error.Abort(_('old bundle types only supports v1 '

148

'changegroups'))

148

'changegroups'))

149

header, comp = bundletypes[bundletype]

149

header, comp = bundletypes[bundletype]

150

if comp not in util.compressors:

150

if comp not in util.compressors:

151

raise error.Abort(_('unknown stream compression type: %s')

151

raise error.Abort(_('unknown stream compression type: %s')

152

% comp)

152

% comp)

153

z = util.compressors[comp]()

153

z = util.compressors[comp]()

154

subchunkiter = cg.getchunks()

154

subchunkiter = cg.getchunks()

155

def chunkiter():

155

def chunkiter():

156

yield header

156

yield header

157

for chunk in subchunkiter:

157

for chunk in subchunkiter:

158

yield z.compress(chunk)

158

yield z.compress(chunk)

159

yield z.flush()

159

yield z.flush()

160

chunkiter = chunkiter()

160

chunkiter = chunkiter()

161

162

# parse the changegroup data, otherwise we will block

162

# parse the changegroup data, otherwise we will block

163

# in case of sshrepo because we don't know the end of the stream

163

# in case of sshrepo because we don't know the end of the stream

164

165

# an empty chunkgroup is the end of the changegroup

165

# an empty chunkgroup is the end of the changegroup

166

# a changegroup has at least 2 chunkgroups (changelog and manifest).

166

# a changegroup has at least 2 chunkgroups (changelog and manifest).

167

# after that, an empty chunkgroup is the end of the changegroup

167

# after that, an empty chunkgroup is the end of the changegroup

168

return writechunks(ui, chunkiter, filename, vfs=vfs)

168

return writechunks(ui, chunkiter, filename, vfs=vfs)

169

170

class cg1unpacker(object):

170

class cg1unpacker(object):

171

"""Unpacker for cg1 changegroup streams.

171

"""Unpacker for cg1 changegroup streams.

172

173

A changegroup unpacker handles the framing of the revision data in

173

A changegroup unpacker handles the framing of the revision data in

174

the wire format. Most consumers will want to use the apply()

174

the wire format. Most consumers will want to use the apply()

175

method to add the changes from the changegroup to a repository.

175

method to add the changes from the changegroup to a repository.

176

177

If you're forwarding a changegroup unmodified to another consumer,

177

If you're forwarding a changegroup unmodified to another consumer,

178

use getchunks(), which returns an iterator of changegroup

178

use getchunks(), which returns an iterator of changegroup

179

chunks. This is mostly useful for cases where you need to know the

179

chunks. This is mostly useful for cases where you need to know the

180

data stream has ended by observing the end of the changegroup.

180

data stream has ended by observing the end of the changegroup.

181

182

deltachunk() is useful only if you're applying delta data. Most

182

deltachunk() is useful only if you're applying delta data. Most

183

consumers should prefer apply() instead.

183

consumers should prefer apply() instead.

184

185

A few other public methods exist. Those are used only for

185

A few other public methods exist. Those are used only for

186

bundlerepo and some debug commands - their use is discouraged.

186

bundlerepo and some debug commands - their use is discouraged.

187

"""

187

"""

188

deltaheader = _CHANGEGROUPV1_DELTA_HEADER

188

deltaheader = _CHANGEGROUPV1_DELTA_HEADER

189

deltaheadersize = struct.calcsize(deltaheader)

189

deltaheadersize = struct.calcsize(deltaheader)

190

version = '01'

190

version = '01'

191

def __init__(self, fh, alg):

191

def __init__(self, fh, alg):

192

if alg == 'UN':

192

if alg == 'UN':

193

alg = None # get more modern without breaking too much

193

alg = None # get more modern without breaking too much

194

if not alg in util.decompressors:

194

if not alg in util.decompressors:

195

raise error.Abort(_('unknown stream compression type: %s')

195

raise error.Abort(_('unknown stream compression type: %s')

196

% alg)

196

% alg)

197

if alg == 'BZ':

197

if alg == 'BZ':

198

alg = '_truncatedBZ'

198

alg = '_truncatedBZ'

199

self._stream = util.decompressors[alg](fh)

199

self._stream = util.decompressors[alg](fh)

200

self._type = alg

200

self._type = alg

201

self.callback = None

201

self.callback = None

202

203

# These methods (compressed, read, seek, tell) all appear to only

203

# These methods (compressed, read, seek, tell) all appear to only

204

# be used by bundlerepo, but it's a little hard to tell.

204

# be used by bundlerepo, but it's a little hard to tell.

205

def compressed(self):

205

def compressed(self):

206

return self._type is not None

206

return self._type is not None

207

def read(self, l):

207

def read(self, l):

208

return self._stream.read(l)

208

return self._stream.read(l)

209

def seek(self, pos):

209

def seek(self, pos):

210

return self._stream.seek(pos)

210

return self._stream.seek(pos)

211

def tell(self):

211

def tell(self):

212

return self._stream.tell()

212

return self._stream.tell()

213

def close(self):

213

def close(self):

214

return self._stream.close()

214

return self._stream.close()

215

216

def _chunklength(self):

216

def _chunklength(self):

217

d = readexactly(self._stream, 4)

217

d = readexactly(self._stream, 4)

218

l = struct.unpack(">l", d)[0]

218

l = struct.unpack(">l", d)[0]

219

if l <= 4:

219

if l <= 4:

220

if l:

220

if l:

221

raise error.Abort(_("invalid chunk length %d") % l)

221

raise error.Abort(_("invalid chunk length %d") % l)

222

return 0

222

return 0

223

if self.callback:

223

if self.callback:

224

self.callback()

224

self.callback()

225

return l - 4

225

return l - 4

226

227

def changelogheader(self):

227

def changelogheader(self):

228

"""v10 does not have a changelog header chunk"""

228

"""v10 does not have a changelog header chunk"""

229

return {}

229

return {}

230

231

def manifestheader(self):

231

def manifestheader(self):

232

"""v10 does not have a manifest header chunk"""

232

"""v10 does not have a manifest header chunk"""

233

return {}

233

return {}

234

235

def filelogheader(self):

235

def filelogheader(self):

236

"""return the header of the filelogs chunk, v10 only has the filename"""

236

"""return the header of the filelogs chunk, v10 only has the filename"""

237

l = self._chunklength()

237

l = self._chunklength()

238

if not l:

238

if not l:

239

return {}

239

return {}

240

fname = readexactly(self._stream, l)

240

fname = readexactly(self._stream, l)

241

return {'filename': fname}

241

return {'filename': fname}

242

243

def _deltaheader(self, headertuple, prevnode):

243

def _deltaheader(self, headertuple, prevnode):

244

node, p1, p2, cs = headertuple

244

node, p1, p2, cs = headertuple

245

if prevnode is None:

245

if prevnode is None:

246

deltabase = p1

246

deltabase = p1

247

else:

247

else:

248

deltabase = prevnode

248

deltabase = prevnode

249

return node, p1, p2, deltabase, cs

249

return node, p1, p2, deltabase, cs

250

251

def deltachunk(self, prevnode):

251

def deltachunk(self, prevnode):

252

l = self._chunklength()

252

l = self._chunklength()

253

if not l:

253

if not l:

254

return {}

254

return {}

255

headerdata = readexactly(self._stream, self.deltaheadersize)

255

headerdata = readexactly(self._stream, self.deltaheadersize)

256

header = struct.unpack(self.deltaheader, headerdata)

256

header = struct.unpack(self.deltaheader, headerdata)

257

delta = readexactly(self._stream, l - self.deltaheadersize)

257

delta = readexactly(self._stream, l - self.deltaheadersize)

258

node, p1, p2, deltabase, cs = self._deltaheader(header, prevnode)

258

node, p1, p2, deltabase, cs = self._deltaheader(header, prevnode)

259

return {'node': node, 'p1': p1, 'p2': p2, 'cs': cs,

259

return {'node': node, 'p1': p1, 'p2': p2, 'cs': cs,

260

'deltabase': deltabase, 'delta': delta}

260

'deltabase': deltabase, 'delta': delta}

261

262

def getchunks(self):

262

def getchunks(self):

263

"""returns all the chunks contains in the bundle

263

"""returns all the chunks contains in the bundle

264

265

Used when you need to forward the binary stream to a file or another

265

Used when you need to forward the binary stream to a file or another

266

network API. To do so, it parse the changegroup data, otherwise it will

266

network API. To do so, it parse the changegroup data, otherwise it will

267

block in case of sshrepo because it don't know the end of the stream.

267

block in case of sshrepo because it don't know the end of the stream.

268

"""

268

"""

269

# an empty chunkgroup is the end of the changegroup

269

# an empty chunkgroup is the end of the changegroup

270

# a changegroup has at least 2 chunkgroups (changelog and manifest).

270

# a changegroup has at least 2 chunkgroups (changelog and manifest).

271

# after that, an empty chunkgroup is the end of the changegroup

271

# after that, an empty chunkgroup is the end of the changegroup

272

empty = False

272

empty = False

273

count = 0

273

count = 0

274

while not empty or count <= 2:

274

while not empty or count <= 2:

275

empty = True

275

empty = True

276

count += 1

276

count += 1

277

while True:

277

while True:

278

chunk = getchunk(self)

278

chunk = getchunk(self)

279

if not chunk:

279

if not chunk:

280

break

280

break

281

empty = False

281

empty = False

282

yield chunkheader(len(chunk))

282

yield chunkheader(len(chunk))

283

pos = 0

283

pos = 0

284

while pos < len(chunk):

284

while pos < len(chunk):

285

next = pos + 2**20

285

next = pos + 2**20

286

yield chunk[pos:next]

286

yield chunk[pos:next]

287

pos = next

287

pos = next

288

yield closechunk()

288

yield closechunk()

289

290

def _unpackmanifests(self, repo, revmap, trp, prog, numchanges):

290

def _unpackmanifests(self, repo, revmap, trp, prog, numchanges):

291

# We know that we'll never have more manifests than we had

291

# We know that we'll never have more manifests than we had

292

# changesets.

292

# changesets.

293

self.callback = prog(_('manifests'), numchanges)

293

self.callback = prog(_('manifests'), numchanges)

294

# no need to check for empty manifest group here:

294

# no need to check for empty manifest group here:

295

# if the result of the merge of 1 and 2 is the same in 3 and 4,

295

# if the result of the merge of 1 and 2 is the same in 3 and 4,

296

# no new manifest will be created and the manifest group will

296

# no new manifest will be created and the manifest group will

297

# be empty during the pull

297

# be empty during the pull

298

self.manifestheader()

298

self.manifestheader()

299

repo.manifest.addgroup(self, revmap, trp)

299

repo.manifest.addgroup(self, revmap, trp)

300

repo.ui.progress(_('manifests'), None)

300

repo.ui.progress(_('manifests'), None)

301

302

def apply(self, repo, srctype, url, emptyok=False,

302

def apply(self, repo, srctype, url, emptyok=False,

303

targetphase=phases.draft, expectedtotal=None):

303

targetphase=phases.draft, expectedtotal=None):

304

"""Add the changegroup returned by source.read() to this repo.

304

"""Add the changegroup returned by source.read() to this repo.

305

srctype is a string like 'push', 'pull', or 'unbundle'. url is

305

srctype is a string like 'push', 'pull', or 'unbundle'. url is

306

the URL of the repo where this changegroup is coming from.

306

the URL of the repo where this changegroup is coming from.

307

308

Return an integer summarizing the change to this repo:

308

Return an integer summarizing the change to this repo:

309

- nothing changed or no source: 0

309

- nothing changed or no source: 0

310

- more heads than before: 1+added heads (2..n)

310

- more heads than before: 1+added heads (2..n)

311

- fewer heads than before: -1-removed heads (-2..-n)

311

- fewer heads than before: -1-removed heads (-2..-n)

312

- number of heads stays the same: 1

312

- number of heads stays the same: 1

313

"""

313

"""

314

repo = repo.unfiltered()

314

repo = repo.unfiltered()

315

wasempty = (len(repo.changelog) == 0)

315

wasempty = (len(repo.changelog) == 0)

316

def csmap(x):

316

def csmap(x):

317

repo.ui.debug("add changeset %s\n" % short(x))

317

repo.ui.debug("add changeset %s\n" % short(x))

318

return len(cl)

318

return len(cl)

319

320

def revmap(x):

320

def revmap(x):

321

return cl.rev(x)

321

return cl.rev(x)

322

323

changesets = files = revisions = 0

323

changesets = files = revisions = 0

324

325

tr = repo.transaction("\n".join([srctype, util.hidepassword(url)]))

325

tr = repo.transaction("\n".join([srctype, util.hidepassword(url)]))

326

try:

326

try:

327

# The transaction could have been created before and already

327

# The transaction could have been created before and already

328

# carries source information. In this case we use the top

328

# carries source information. In this case we use the top

329

# level data. We overwrite the argument because we need to use

329

# level data. We overwrite the argument because we need to use

330

# the top level value (if they exist) in this function.

330

# the top level value (if they exist) in this function.

331

srctype = tr.hookargs.setdefault('source', srctype)

331

srctype = tr.hookargs.setdefault('source', srctype)

332

url = tr.hookargs.setdefault('url', url)

332

url = tr.hookargs.setdefault('url', url)

333

repo.hook('prechangegroup', throw=True, **tr.hookargs)

333

repo.hook('prechangegroup', throw=True, **tr.hookargs)

334

335

# write changelog data to temp files so concurrent readers

335

# write changelog data to temp files so concurrent readers

336

# will not see an inconsistent view

336

# will not see an inconsistent view

337

cl = repo.changelog

337

cl = repo.changelog

338

cl.delayupdate(tr)

338

cl.delayupdate(tr)

339

oldheads = cl.heads()

339

oldheads = cl.heads()

340

341

trp = weakref.proxy(tr)

341

trp = weakref.proxy(tr)

342

# pull off the changeset group

342

# pull off the changeset group

343

repo.ui.status(_("adding changesets\n"))

343

repo.ui.status(_("adding changesets\n"))

344

clstart = len(cl)

344

clstart = len(cl)

345

class prog(object):

345

class prog(object):

346

def __init__(self, step, total):

346

def __init__(self, step, total):

347

self._step = step

347

self._step = step

348

self._total = total

348

self._total = total

349

self._count = 1

349

self._count = 1

350

def __call__(self):

350

def __call__(self):

351

repo.ui.progress(self._step, self._count, unit=_('chunks'),

351

repo.ui.progress(self._step, self._count, unit=_('chunks'),

352

total=self._total)

352

total=self._total)

353

self._count += 1

353

self._count += 1

354

self.callback = prog(_('changesets'), expectedtotal)

354

self.callback = prog(_('changesets'), expectedtotal)

355

356

efiles = set()

356

efiles = set()

357

def onchangelog(cl, node):

357

def onchangelog(cl, node):

358

efiles.update(cl.read(node)[3])

358

efiles.update(cl.read(node)[3])

359

360

self.changelogheader()

360

self.changelogheader()

361

srccontent = cl.addgroup(self, csmap, trp,

361

srccontent = cl.addgroup(self, csmap, trp,

362

addrevisioncb=onchangelog)

362

addrevisioncb=onchangelog)

363

efiles = len(efiles)

363

efiles = len(efiles)

364

365

if not (srccontent or emptyok):

365

if not (srccontent or emptyok):

366

raise error.Abort(_("received changelog group is empty"))

366

raise error.Abort(_("received changelog group is empty"))

367

clend = len(cl)

367

clend = len(cl)

368

changesets = clend - clstart

368

changesets = clend - clstart

369

repo.ui.progress(_('changesets'), None)

369

repo.ui.progress(_('changesets'), None)

370

371

# pull off the manifest group

371

# pull off the manifest group

372

repo.ui.status(_("adding manifests\n"))

372

repo.ui.status(_("adding manifests\n"))

373

self._unpackmanifests(repo, revmap, trp, prog, changesets)

373

self._unpackmanifests(repo, revmap, trp, prog, changesets)

374

375

needfiles = {}

375

needfiles = {}

376

if repo.ui.configbool('server', 'validate', default=False):

376

if repo.ui.configbool('server', 'validate', default=False):

377

# validate incoming csets have their manifests

377

# validate incoming csets have their manifests

378

for cset in xrange(clstart, clend):

378

for cset in xrange(clstart, clend):

379

mfnode = repo.changelog.read(repo.changelog.node(cset))[0]

379

mfnode = repo.changelog.read(repo.changelog.node(cset))[0]

380

mfest = repo.manifest.readdelta(mfnode)

380

mfest = repo.manifest.readdelta(mfnode)

381

# store file nodes we must see

381

# store file nodes we must see

382

for f, n in mfest.iteritems():

382

for f, n in mfest.iteritems():

383

needfiles.setdefault(f, set()).add(n)

383

needfiles.setdefault(f, set()).add(n)

384

385

# process the files

385

# process the files

386

repo.ui.status(_("adding file changes\n"))

386

repo.ui.status(_("adding file changes\n"))

387

self.callback = None

387

self.callback = None

388

pr = prog(_('files'), efiles)

388

pr = prog(_('files'), efiles)

389

newrevs, newfiles = _addchangegroupfiles(

389

newrevs, newfiles = _addchangegroupfiles(

390

repo, self, revmap, trp, pr, needfiles, wasempty)

390

repo, self, revmap, trp, pr, needfiles, wasempty)

391

revisions += newrevs

391

revisions += newrevs

392

files += newfiles

392

files += newfiles

393

394

dh = 0

394

dh = 0

395

if oldheads:

395

if oldheads:

396

heads = cl.heads()

396

heads = cl.heads()

397

dh = len(heads) - len(oldheads)

397

dh = len(heads) - len(oldheads)

398

for h in heads:

398

for h in heads:

399

if h not in oldheads and repo[h].closesbranch():

399

if h not in oldheads and repo[h].closesbranch():

400

dh -= 1

400

dh -= 1

401

htext = ""

401

htext = ""

402

if dh:

402

if dh:

403

htext = _(" (%+d heads)") % dh

403

htext = _(" (%+d heads)") % dh

404

405

repo.ui.status(_("added %d changesets"

405

repo.ui.status(_("added %d changesets"

406

" with %d changes to %d files%s\n")

406

" with %d changes to %d files%s\n")

407

% (changesets, revisions, files, htext))

407

% (changesets, revisions, files, htext))

408

repo.invalidatevolatilesets()

408

repo.invalidatevolatilesets()

409

410

if changesets > 0:

410

if changesets > 0:

411

if 'node' not in tr.hookargs:

411

if 'node' not in tr.hookargs:

412

tr.hookargs['node'] = hex(cl.node(clstart))

412

tr.hookargs['node'] = hex(cl.node(clstart))

413

hookargs = dict(tr.hookargs)

413

hookargs = dict(tr.hookargs)

414

else:

414

else:

415

hookargs = dict(tr.hookargs)

415

hookargs = dict(tr.hookargs)

416

hookargs['node'] = hex(cl.node(clstart))

416

hookargs['node'] = hex(cl.node(clstart))

417

repo.hook('pretxnchangegroup', throw=True, **hookargs)

417

repo.hook('pretxnchangegroup', throw=True, **hookargs)

418

419

added = [cl.node(r) for r in xrange(clstart, clend)]

419

added = [cl.node(r) for r in xrange(clstart, clend)]

420

publishing = repo.publishing()

420

publishing = repo.publishing()

421

if srctype in ('push', 'serve'):

421

if srctype in ('push', 'serve'):

422

# Old servers can not push the boundary themselves.

422

# Old servers can not push the boundary themselves.

423

# New servers won't push the boundary if changeset already

423

# New servers won't push the boundary if changeset already

424

# exists locally as secret

424

# exists locally as secret

425

#

425

#

426

# We should not use added here but the list of all change in

426

# We should not use added here but the list of all change in

427

# the bundle

427

# the bundle

428

if publishing:

428

if publishing:

429

phases.advanceboundary(repo, tr, phases.public, srccontent)

429

phases.advanceboundary(repo, tr, phases.public, srccontent)

430

else:

430

else:

431

# Those changesets have been pushed from the outside, their

431

# Those changesets have been pushed from the outside, their

432

# phases are going to be pushed alongside. Therefor

432

# phases are going to be pushed alongside. Therefor

433

# `targetphase` is ignored.

433

# `targetphase` is ignored.

434

phases.advanceboundary(repo, tr, phases.draft, srccontent)

434

phases.advanceboundary(repo, tr, phases.draft, srccontent)

435

phases.retractboundary(repo, tr, phases.draft, added)

435

phases.retractboundary(repo, tr, phases.draft, added)

436

elif srctype != 'strip':

436

elif srctype != 'strip':

437

# publishing only alter behavior during push

437

# publishing only alter behavior during push

438

#

438

#

439

# strip should not touch boundary at all

439

# strip should not touch boundary at all

440

phases.retractboundary(repo, tr, targetphase, added)

440

phases.retractboundary(repo, tr, targetphase, added)

441

442

if changesets > 0:

442

if changesets > 0:

443

if srctype != 'strip':

443

if srctype != 'strip':

444

# During strip, branchcache is invalid but coming call to

444

# During strip, branchcache is invalid but coming call to

445

# `destroyed` will repair it.

445

# `destroyed` will repair it.

446

# In other case we can safely update cache on disk.

446

# In other case we can safely update cache on disk.

447

branchmap.updatecache(repo.filtered('served'))

447

branchmap.updatecache(repo.filtered('served'))

448

449

def runhooks():

449

def runhooks():

450

# These hooks run when the lock releases, not when the

450

# These hooks run when the lock releases, not when the

451

# transaction closes. So it's possible for the changelog

451

# transaction closes. So it's possible for the changelog

452

# to have changed since we last saw it.

452

# to have changed since we last saw it.

453

if clstart >= len(repo):

453

if clstart >= len(repo):

454

return

454

return

455

456

# forcefully update the on-disk branch cache

456

# forcefully update the on-disk branch cache

457

repo.ui.debug("updating the branch cache\n")

457

repo.ui.debug("updating the branch cache\n")

458

repo.hook("changegroup", **hookargs)

458

repo.hook("changegroup", **hookargs)

459

460

for n in added:

460

for n in added:

461

args = hookargs.copy()

461

args = hookargs.copy()

462

args['node'] = hex(n)

462

args['node'] = hex(n)

463

repo.hook("incoming", **args)

463

repo.hook("incoming", **args)

464

465

newheads = [h for h in repo.heads() if h not in oldheads]

465

newheads = [h for h in repo.heads() if h not in oldheads]

466

repo.ui.log("incoming",

466

repo.ui.log("incoming",

467

"%s incoming changes - new heads: %s\n",

467

"%s incoming changes - new heads: %s\n",

468

len(added),

468

len(added),

469

', '.join([hex(c[:6]) for c in newheads]))

469

', '.join([hex(c[:6]) for c in newheads]))

470

471

tr.addpostclose('changegroup-runhooks-%020i' % clstart,

471

tr.addpostclose('changegroup-runhooks-%020i' % clstart,

472

lambda tr: repo._afterlock(runhooks))

472

lambda tr: repo._afterlock(runhooks))

473

474

tr.close()

474

tr.close()

475

476

finally:

476

finally:

477

tr.release()

477

tr.release()

478

repo.ui.flush()

478

repo.ui.flush()

479

# never return 0 here:

479

# never return 0 here:

480

if dh < 0:

480

if dh < 0:

481

return dh - 1

481

return dh - 1

482

else:

482

else:

483

return dh + 1

483

return dh + 1

484

485

class cg2unpacker(cg1unpacker):

485

class cg2unpacker(cg1unpacker):

486

"""Unpacker for cg2 streams.

486

"""Unpacker for cg2 streams.

487

488

cg2 streams add support for generaldelta, so the delta header

488

cg2 streams add support for generaldelta, so the delta header

489

format is slightly different. All other features about the data

489

format is slightly different. All other features about the data

490

remain the same.

490

remain the same.

491

"""

491

"""

492

deltaheader = _CHANGEGROUPV2_DELTA_HEADER

492

deltaheader = _CHANGEGROUPV2_DELTA_HEADER

493

deltaheadersize = struct.calcsize(deltaheader)

493

deltaheadersize = struct.calcsize(deltaheader)

494

version = '02'

494

version = '02'

495

496

def _deltaheader(self, headertuple, prevnode):

496

def _deltaheader(self, headertuple, prevnode):

497

node, p1, p2, deltabase, cs = headertuple

497

node, p1, p2, deltabase, cs = headertuple

498

return node, p1, p2, deltabase, cs

498

return node, p1, p2, deltabase, cs

499

500

class headerlessfixup(object):

500

class headerlessfixup(object):

501

def __init__(self, fh, h):

501

def __init__(self, fh, h):

502

self._h = h

502

self._h = h

503

self._fh = fh

503

self._fh = fh

504

def read(self, n):

504

def read(self, n):

505

if self._h:

505

if self._h:

506

d, self._h = self._h[:n], self._h[n:]

506

d, self._h = self._h[:n], self._h[n:]

507

if len(d) < n:

507

if len(d) < n:

508

d += readexactly(self._fh, n - len(d))

508

d += readexactly(self._fh, n - len(d))

509

return d

509

return d

510

return readexactly(self._fh, n)

510

return readexactly(self._fh, n)

511

512

class cg1packer(object):

512

class cg1packer(object):

513

deltaheader = _CHANGEGROUPV1_DELTA_HEADER

513

deltaheader = _CHANGEGROUPV1_DELTA_HEADER

514

version = '01'

514

version = '01'

515

def __init__(self, repo, bundlecaps=None):

515

def __init__(self, repo, bundlecaps=None):

516

"""Given a source repo, construct a bundler.

516

"""Given a source repo, construct a bundler.

517

518

bundlecaps is optional and can be used to specify the set of

518

bundlecaps is optional and can be used to specify the set of

519

capabilities which can be used to build the bundle.

519

capabilities which can be used to build the bundle.

520

"""

520

"""

521

# Set of capabilities we can use to build the bundle.

521

# Set of capabilities we can use to build the bundle.

522

if bundlecaps is None:

522

if bundlecaps is None:

523

bundlecaps = set()

523

bundlecaps = set()

524

self._bundlecaps = bundlecaps

524

self._bundlecaps = bundlecaps

525

# experimental config: bundle.reorder

525

# experimental config: bundle.reorder

526

reorder = repo.ui.config('bundle', 'reorder', 'auto')

526

reorder = repo.ui.config('bundle', 'reorder', 'auto')

527

if reorder == 'auto':

527

if reorder == 'auto':

528

reorder = None

528

reorder = None

529

else:

529

else:

530

reorder = util.parsebool(reorder)

530

reorder = util.parsebool(reorder)

531

self._repo = repo

531

self._repo = repo

532

self._reorder = reorder

532

self._reorder = reorder

533

self._progress = repo.ui.progress

533

self._progress = repo.ui.progress

534

if self._repo.ui.verbose and not self._repo.ui.debugflag:

534

if self._repo.ui.verbose and not self._repo.ui.debugflag:

535

self._verbosenote = self._repo.ui.note

535

self._verbosenote = self._repo.ui.note

536

else:

536

else:

537

self._verbosenote = lambda s: None

537

self._verbosenote = lambda s: None

538

539

def close(self):

539

def close(self):

540

return closechunk()

540

return closechunk()

541

542

def fileheader(self, fname):

542

def fileheader(self, fname):

543

return chunkheader(len(fname)) + fname

543

return chunkheader(len(fname)) + fname

544

545

def group(self, nodelist, revlog, lookup, units=None):

545

def group(self, nodelist, revlog, lookup, units=None):

546

"""Calculate a delta group, yielding a sequence of changegroup chunks

546

"""Calculate a delta group, yielding a sequence of changegroup chunks

547

(strings).

547

(strings).

548

549

Given a list of changeset revs, return a set of deltas and

549

Given a list of changeset revs, return a set of deltas and

550

metadata corresponding to nodes. The first delta is

550

metadata corresponding to nodes. The first delta is

551

first parent(nodelist[0]) -> nodelist[0], the receiver is

551

first parent(nodelist[0]) -> nodelist[0], the receiver is

552

guaranteed to have this parent as it has all history before

552

guaranteed to have this parent as it has all history before

553

these changesets. In the case firstparent is nullrev the

553

these changesets. In the case firstparent is nullrev the

554

changegroup starts with a full revision.

554

changegroup starts with a full revision.

555

556

If units is not None, progress detail will be generated, units specifies

556

If units is not None, progress detail will be generated, units specifies

557

the type of revlog that is touched (changelog, manifest, etc.).

557

the type of revlog that is touched (changelog, manifest, etc.).

558

"""

558

"""

559

# if we don't have any revisions touched by these changesets, bail

559

# if we don't have any revisions touched by these changesets, bail

560

if len(nodelist) == 0:

560

if len(nodelist) == 0:

561

yield self.close()

561

yield self.close()

562

return

562

return

563

564

# for generaldelta revlogs, we linearize the revs; this will both be

564

# for generaldelta revlogs, we linearize the revs; this will both be

565

# much quicker and generate a much smaller bundle

565

# much quicker and generate a much smaller bundle

566

if (revlog._generaldelta and self._reorder is None) or self._reorder:

566

if (revlog._generaldelta and self._reorder is None) or self._reorder:

567

dag = dagutil.revlogdag(revlog)

567

dag = dagutil.revlogdag(revlog)

568

revs = set(revlog.rev(n) for n in nodelist)

568

revs = set(revlog.rev(n) for n in nodelist)

569

revs = dag.linearize(revs)

569

revs = dag.linearize(revs)

570

else:

570

else:

571

revs = sorted([revlog.rev(n) for n in nodelist])

571

revs = sorted([revlog.rev(n) for n in nodelist])

572

573

# add the parent of the first rev

573

# add the parent of the first rev

574

p = revlog.parentrevs(revs[0])[0]

574

p = revlog.parentrevs(revs[0])[0]

575

revs.insert(0, p)

575

revs.insert(0, p)

576

577

# build deltas

577

# build deltas

578

total = len(revs) - 1

578

total = len(revs) - 1

579

msgbundling = _('bundling')

579

msgbundling = _('bundling')

580

for r in xrange(len(revs) - 1):

580

for r in xrange(len(revs) - 1):

581

if units is not None:

581

if units is not None:

582

self._progress(msgbundling, r + 1, unit=units, total=total)

582

self._progress(msgbundling, r + 1, unit=units, total=total)

583

prev, curr = revs[r], revs[r + 1]

583

prev, curr = revs[r], revs[r + 1]

584

linknode = lookup(revlog.node(curr))

584

linknode = lookup(revlog.node(curr))

585

for c in self.revchunk(revlog, curr, prev, linknode):

585

for c in self.revchunk(revlog, curr, prev, linknode):

586

yield c

586

yield c

587

588

if units is not None:

588

if units is not None:

589

self._progress(msgbundling, None)

589

self._progress(msgbundling, None)

590

yield self.close()

590

yield self.close()

591

592

# filter any nodes that claim to be part of the known set

592

# filter any nodes that claim to be part of the known set

593

def prune(self, revlog, missing, commonrevs):

593

def prune(self, revlog, missing, commonrevs):

594

rr, rl = revlog.rev, revlog.linkrev

594

rr, rl = revlog.rev, revlog.linkrev

595

return [n for n in missing if rl(rr(n)) not in commonrevs]

595

return [n for n in missing if rl(rr(n)) not in commonrevs]

596

597

def _packmanifests(self, mfnodes, lookuplinknode):

597

def _packmanifests(self, mfnodes, lookuplinknode):

598

"""Pack flat manifests into a changegroup stream."""

598

"""Pack flat manifests into a changegroup stream."""

599

ml = self._repo.manifest

599

ml = self._repo.manifest

600

size = 0

600

size = 0

601

for chunk in self.group(

601

for chunk in self.group(

602

mfnodes, ml, lookuplinknode, units=_('manifests')):

602

mfnodes, ml, lookuplinknode, units=_('manifests')):

603

size += len(chunk)

603

size += len(chunk)

604

yield chunk

604

yield chunk

605

self._verbosenote(_('%8.i (manifests)\n') % size)

605

self._verbosenote(_('%8.i (manifests)\n') % size)

606

607

def generate(self, commonrevs, clnodes, fastpathlinkrev, source):

607

def generate(self, commonrevs, clnodes, fastpathlinkrev, source):

608

'''yield a sequence of changegroup chunks (strings)'''

608

'''yield a sequence of changegroup chunks (strings)'''

609

repo = self._repo

609

repo = self._repo

610

cl = repo.changelog

610

cl = repo.changelog

611

ml = repo.manifest

611

ml = repo.manifest

612

613

clrevorder = {}

613

clrevorder = {}

614

mfs = {} # needed manifests

614

mfs = {} # needed manifests

615

fnodes = {} # needed file nodes

615

fnodes = {} # needed file nodes

616

# maps manifest node id -> set(changed files)

616

# maps manifest node id -> set(changed files)

617

mfchangedfiles = {}

617

mfchangedfiles = {}

618

619

# Callback for the changelog, used to collect changed files and manifest

619

# Callback for the changelog, used to collect changed files and manifest

620

# nodes.

620

# nodes.

621

# Returns the linkrev node (identity in the changelog case).

621

# Returns the linkrev node (identity in the changelog case).

622

def lookupcl(x):

622

def lookupcl(x):

623

c = cl.read(x)

623

c = cl.read(x)

624

clrevorder[x] = len(clrevorder)

624

clrevorder[x] = len(clrevorder)

625

n = c[0]

625

n = c[0]

626

# record the first changeset introducing this manifest version

626

# record the first changeset introducing this manifest version

627

mfs.setdefault(n, x)

627

mfs.setdefault(n, x)

628

# Record a complete list of potentially-changed files in

628

# Record a complete list of potentially-changed files in

629

# this manifest.

629

# this manifest.

630

mfchangedfiles.setdefault(n, set()).update(c[3])

630

mfchangedfiles.setdefault(n, set()).update(c[3])

631

return x

631

return x

632

633

self._verbosenote(_('uncompressed size of bundle content:\n'))

633

self._verbosenote(_('uncompressed size of bundle content:\n'))

634

size = 0

634

size = 0

635

for chunk in self.group(clnodes, cl, lookupcl, units=_('changesets')):

635

for chunk in self.group(clnodes, cl, lookupcl, units=_('changesets')):

636

size += len(chunk)

636

size += len(chunk)

637

yield chunk

637

yield chunk

638

self._verbosenote(_('%8.i (changelog)\n') % size)

638

self._verbosenote(_('%8.i (changelog)\n') % size)

639

640

# We need to make sure that the linkrev in the changegroup refers to

640

# We need to make sure that the linkrev in the changegroup refers to

641

# the first changeset that introduced the manifest or file revision.

641

# the first changeset that introduced the manifest or file revision.

642

# The fastpath is usually safer than the slowpath, because the filelogs

642

# The fastpath is usually safer than the slowpath, because the filelogs

643

# are walked in revlog order.

643

# are walked in revlog order.

644

#

644

#

645

# When taking the slowpath with reorder=None and the manifest revlog

645

# When taking the slowpath with reorder=None and the manifest revlog

646

# uses generaldelta, the manifest may be walked in the "wrong" order.

646

# uses generaldelta, the manifest may be walked in the "wrong" order.

647

# Without 'clrevorder', we would get an incorrect linkrev (see fix in

647

# Without 'clrevorder', we would get an incorrect linkrev (see fix in

648

# cc0ff93d0c0c).

648

# cc0ff93d0c0c).

649

#

649

#

650

# When taking the fastpath, we are only vulnerable to reordering

650

# When taking the fastpath, we are only vulnerable to reordering

651

# of the changelog itself. The changelog never uses generaldelta, so

651

# of the changelog itself. The changelog never uses generaldelta, so

652

# it is only reordered when reorder=True. To handle this case, we

652

# it is only reordered when reorder=True. To handle this case, we

653

# simply take the slowpath, which already has the 'clrevorder' logic.

653

# simply take the slowpath, which already has the 'clrevorder' logic.

654

# This was also fixed in cc0ff93d0c0c.

654

# This was also fixed in cc0ff93d0c0c.

655

fastpathlinkrev = fastpathlinkrev and not self._reorder

655

fastpathlinkrev = fastpathlinkrev and not self._reorder

656

# Callback for the manifest, used to collect linkrevs for filelog

656

# Callback for the manifest, used to collect linkrevs for filelog

657

# revisions.

657

# revisions.

658

# Returns the linkrev node (collected in lookupcl).

658

# Returns the linkrev node (collected in lookupcl).

659

def lookupmflinknode(x):

659

def lookupmflinknode(x):

660

"""Callback for looking up the linknode for manifests.

660

"""Callback for looking up the linknode for manifests.

661

662

Returns the linkrev node for the specified manifest.

662

Returns the linkrev node for the specified manifest.

663

664

SIDE EFFECT:

664

SIDE EFFECT:

665

666

fclnodes gets populated with the list of relevant

666

fclnodes gets populated with the list of relevant

667

file nodes if we're not using fastpathlinkrev.

667

file nodes if we're not using fastpathlinkrev.

668

669

Note that this means you can't trust fclnodes until

669

Note that this means you can't trust fclnodes until

670

after manifests have been sent to the client.

670

after manifests have been sent to the client.

671

"""

671

"""

672

clnode = mfs[x]

672

clnode = mfs[x]

673

if not fastpathlinkrev:

673

if not fastpathlinkrev:

674

mdata = ml.readfast(x)

674

mdata = ml.readfast(x)

675

for f in mfchangedfiles[x]:

675

for f in mfchangedfiles[x]:

676

if ~~True~~:

676

try:

677

~~try~~:

677

n = mdata[f]

678

n = mdata[f]

678

except KeyError:

679

~~except~~ ~~KeyError~~:

679

continue

680

continue

680

# record the first changeset introducing this filelog

681

# record the first changeset introducing this filelog

681

# version

682

# version

682

fclnodes = fnodes.setdefault(f, {})

683

fclnodes = fnodes.setdefault(f, {})

683

fclnode = fclnodes.setdefault(n, clnode)

684

fclnode = fclnodes.setdefault(n, clnode)

684

if clrevorder[clnode] < clrevorder[fclnode]:

685

if clrevorder[clnode] < clrevorder[fclnode]:

685

fclnodes[n] = clnode

686

fclnodes[n] = clnode

687

return clnode

686

return clnode

688

687

689

mfnodes = self.prune(ml, mfs, commonrevs)

688

mfnodes = self.prune(ml, mfs, commonrevs)

690

for x in self._packmanifests(mfnodes, lookupmflinknode):

689

for x in self._packmanifests(mfnodes, lookupmflinknode):

691

yield x

690

yield x

692

691

693

mfs.clear()

692

mfs.clear()

694

clrevs = set(cl.rev(x) for x in clnodes)

693

clrevs = set(cl.rev(x) for x in clnodes)

695

694

696

def linknodes(filerevlog, fname):

695

def linknodes(filerevlog, fname):

697

if fastpathlinkrev:

696

if fastpathlinkrev:

698

llr = filerevlog.linkrev

697

llr = filerevlog.linkrev

699

def genfilenodes():

698

def genfilenodes():

700

for r in filerevlog:

699

for r in filerevlog:

701

linkrev = llr(r)

700

linkrev = llr(r)

702

if linkrev in clrevs:

701

if linkrev in clrevs:

703

yield filerevlog.node(r), cl.node(linkrev)

702

yield filerevlog.node(r), cl.node(linkrev)

704

return dict(genfilenodes())

703

return dict(genfilenodes())

705

return fnodes.get(fname, {})

704

return fnodes.get(fname, {})

706

705

707

changedfiles = set()

706

changedfiles = set()

708

for x in mfchangedfiles.itervalues():

707

for x in mfchangedfiles.itervalues():

709

changedfiles.update(x)

708

changedfiles.update(x)

710

for chunk in self.generatefiles(changedfiles, linknodes, commonrevs,

709

for chunk in self.generatefiles(changedfiles, linknodes, commonrevs,

711

source):

710

source):

712

yield chunk

711

yield chunk

713

712

714

yield self.close()

713

yield self.close()

715

714

716

if clnodes:

715

if clnodes:

717

repo.hook('outgoing', node=hex(clnodes[0]), source=source)

716

repo.hook('outgoing', node=hex(clnodes[0]), source=source)

718

717

719

# The 'source' parameter is useful for extensions

718

# The 'source' parameter is useful for extensions

720

def generatefiles(self, changedfiles, linknodes, commonrevs, source):

719

def generatefiles(self, changedfiles, linknodes, commonrevs, source):

721

repo = self._repo

720

repo = self._repo

722

progress = self._progress

721

progress = self._progress

723

msgbundling = _('bundling')

722

msgbundling = _('bundling')

724

723

725

total = len(changedfiles)

724

total = len(changedfiles)

726

# for progress output

725

# for progress output

727

msgfiles = _('files')

726

msgfiles = _('files')

728

for i, fname in enumerate(sorted(changedfiles)):

727

for i, fname in enumerate(sorted(changedfiles)):

729

filerevlog = repo.file(fname)

728

filerevlog = repo.file(fname)

730

if not filerevlog:

729

if not filerevlog:

731

raise error.Abort(_("empty or missing revlog for %s") % fname)

730

raise error.Abort(_("empty or missing revlog for %s") % fname)

732

731

733

linkrevnodes = linknodes(filerevlog, fname)

732

linkrevnodes = linknodes(filerevlog, fname)

734

# Lookup for filenodes, we collected the linkrev nodes above in the

733

# Lookup for filenodes, we collected the linkrev nodes above in the

735

# fastpath case and with lookupmf in the slowpath case.

734

# fastpath case and with lookupmf in the slowpath case.

736

def lookupfilelog(x):

735

def lookupfilelog(x):

737

return linkrevnodes[x]

736

return linkrevnodes[x]

738

737

739

filenodes = self.prune(filerevlog, linkrevnodes, commonrevs)

738

filenodes = self.prune(filerevlog, linkrevnodes, commonrevs)

740

if filenodes:

739

if filenodes:

741

progress(msgbundling, i + 1, item=fname, unit=msgfiles,

740

progress(msgbundling, i + 1, item=fname, unit=msgfiles,

742

total=total)

741

total=total)

743

h = self.fileheader(fname)

742

h = self.fileheader(fname)

744

size = len(h)

743

size = len(h)

745

yield h

744

yield h

746

for chunk in self.group(filenodes, filerevlog, lookupfilelog):

745

for chunk in self.group(filenodes, filerevlog, lookupfilelog):

747

size += len(chunk)

746

size += len(chunk)

748

yield chunk

747

yield chunk

749

self._verbosenote(_('%8.i %s\n') % (size, fname))

748

self._verbosenote(_('%8.i %s\n') % (size, fname))

750

progress(msgbundling, None)

749

progress(msgbundling, None)

751

750

752

def deltaparent(self, revlog, rev, p1, p2, prev):

751

def deltaparent(self, revlog, rev, p1, p2, prev):

753

return prev

752

return prev

754

753

755

def revchunk(self, revlog, rev, prev, linknode):

754

def revchunk(self, revlog, rev, prev, linknode):

756

node = revlog.node(rev)

755

node = revlog.node(rev)

757

p1, p2 = revlog.parentrevs(rev)

756

p1, p2 = revlog.parentrevs(rev)

758

base = self.deltaparent(revlog, rev, p1, p2, prev)

757

base = self.deltaparent(revlog, rev, p1, p2, prev)

759

758

760

prefix = ''

759

prefix = ''

761

if revlog.iscensored(base) or revlog.iscensored(rev):

760

if revlog.iscensored(base) or revlog.iscensored(rev):

762

try:

761

try:

763

delta = revlog.revision(node)

762

delta = revlog.revision(node)

764

except error.CensoredNodeError as e:

763

except error.CensoredNodeError as e:

765

delta = e.tombstone

764

delta = e.tombstone

766

if base == nullrev:

765

if base == nullrev:

767

prefix = mdiff.trivialdiffheader(len(delta))

766

prefix = mdiff.trivialdiffheader(len(delta))

768

else:

767

else:

769

baselen = revlog.rawsize(base)

768

baselen = revlog.rawsize(base)

770

prefix = mdiff.replacediffheader(baselen, len(delta))

769

prefix = mdiff.replacediffheader(baselen, len(delta))

771

elif base == nullrev:

770

elif base == nullrev:

772

delta = revlog.revision(node)

771

delta = revlog.revision(node)

773

prefix = mdiff.trivialdiffheader(len(delta))

772

prefix = mdiff.trivialdiffheader(len(delta))

774

else:

773

else:

775

delta = revlog.revdiff(base, rev)

774

delta = revlog.revdiff(base, rev)

776

p1n, p2n = revlog.parents(node)

775

p1n, p2n = revlog.parents(node)

777

basenode = revlog.node(base)

776

basenode = revlog.node(base)

778

meta = self.builddeltaheader(node, p1n, p2n, basenode, linknode)

777

meta = self.builddeltaheader(node, p1n, p2n, basenode, linknode)

779

meta += prefix

778

meta += prefix

780

l = len(meta) + len(delta)

779

l = len(meta) + len(delta)

781

yield chunkheader(l)

780

yield chunkheader(l)

782

yield meta

781

yield meta

783

yield delta

782

yield delta

784

def builddeltaheader(self, node, p1n, p2n, basenode, linknode):

783

def builddeltaheader(self, node, p1n, p2n, basenode, linknode):

785

# do nothing with basenode, it is implicitly the previous one in HG10

784

# do nothing with basenode, it is implicitly the previous one in HG10

786

return struct.pack(self.deltaheader, node, p1n, p2n, linknode)

785

return struct.pack(self.deltaheader, node, p1n, p2n, linknode)

787

786

788

class cg2packer(cg1packer):

787

class cg2packer(cg1packer):

789

version = '02'

788

version = '02'

790

deltaheader = _CHANGEGROUPV2_DELTA_HEADER

789

deltaheader = _CHANGEGROUPV2_DELTA_HEADER

791

790

792

def __init__(self, repo, bundlecaps=None):

791

def __init__(self, repo, bundlecaps=None):

793

super(cg2packer, self).__init__(repo, bundlecaps)

792

super(cg2packer, self).__init__(repo, bundlecaps)

794

if self._reorder is None:

793

if self._reorder is None:

795

# Since generaldelta is directly supported by cg2, reordering

794

# Since generaldelta is directly supported by cg2, reordering

796

# generally doesn't help, so we disable it by default (treating

795

# generally doesn't help, so we disable it by default (treating

797

# bundle.reorder=auto just like bundle.reorder=False).

796

# bundle.reorder=auto just like bundle.reorder=False).

798

self._reorder = False

797

self._reorder = False

799

798

800

def deltaparent(self, revlog, rev, p1, p2, prev):

799

def deltaparent(self, revlog, rev, p1, p2, prev):

801

dp = revlog.deltaparent(rev)

800

dp = revlog.deltaparent(rev)

802

# avoid storing full revisions; pick prev in those cases

801

# avoid storing full revisions; pick prev in those cases

803

# also pick prev when we can't be sure remote has dp

802

# also pick prev when we can't be sure remote has dp

804

if dp == nullrev or (dp != p1 and dp != p2 and dp != prev):

803

if dp == nullrev or (dp != p1 and dp != p2 and dp != prev):

805

return prev

804

return prev

806

return dp

805

return dp

807

806

808

def builddeltaheader(self, node, p1n, p2n, basenode, linknode):

807

def builddeltaheader(self, node, p1n, p2n, basenode, linknode):

809

return struct.pack(self.deltaheader, node, p1n, p2n, basenode, linknode)

808

return struct.pack(self.deltaheader, node, p1n, p2n, basenode, linknode)

810

809

811

packermap = {'01': (cg1packer, cg1unpacker),

810

packermap = {'01': (cg1packer, cg1unpacker),

812

# cg2 adds support for exchanging generaldelta

811

# cg2 adds support for exchanging generaldelta

813

'02': (cg2packer, cg2unpacker),

812

'02': (cg2packer, cg2unpacker),

814

}

813

}

815

814

816

def _changegroupinfo(repo, nodes, source):

815

def _changegroupinfo(repo, nodes, source):

817

if repo.ui.verbose or source == 'bundle':

816

if repo.ui.verbose or source == 'bundle':

818

repo.ui.status(_("%d changesets found\n") % len(nodes))

817

repo.ui.status(_("%d changesets found\n") % len(nodes))

819

if repo.ui.debugflag:

818

if repo.ui.debugflag:

820

repo.ui.debug("list of changesets:\n")

819

repo.ui.debug("list of changesets:\n")

821

for node in nodes:

820

for node in nodes:

822

repo.ui.debug("%s\n" % hex(node))

821

repo.ui.debug("%s\n" % hex(node))

823

822

824

def getsubsetraw(repo, outgoing, bundler, source, fastpath=False):

823

def getsubsetraw(repo, outgoing, bundler, source, fastpath=False):

825

repo = repo.unfiltered()

824

repo = repo.unfiltered()

826

commonrevs = outgoing.common

825

commonrevs = outgoing.common

827

csets = outgoing.missing

826

csets = outgoing.missing

828

heads = outgoing.missingheads

827

heads = outgoing.missingheads

829

# We go through the fast path if we get told to, or if all (unfiltered

828

# We go through the fast path if we get told to, or if all (unfiltered

830

# heads have been requested (since we then know there all linkrevs will

829

# heads have been requested (since we then know there all linkrevs will

831

# be pulled by the client).

830

# be pulled by the client).

832

heads.sort()

831

heads.sort()

833

fastpathlinkrev = fastpath or (

832

fastpathlinkrev = fastpath or (

834

repo.filtername is None and heads == sorted(repo.heads()))

833

repo.filtername is None and heads == sorted(repo.heads()))

835

834

836

repo.hook('preoutgoing', throw=True, source=source)

835

repo.hook('preoutgoing', throw=True, source=source)

837

_changegroupinfo(repo, csets, source)

836

_changegroupinfo(repo, csets, source)

838

return bundler.generate(commonrevs, csets, fastpathlinkrev, source)

837

return bundler.generate(commonrevs, csets, fastpathlinkrev, source)

839

838

840

def getsubset(repo, outgoing, bundler, source, fastpath=False):

839

def getsubset(repo, outgoing, bundler, source, fastpath=False):

841

gengroup = getsubsetraw(repo, outgoing, bundler, source, fastpath)

840

gengroup = getsubsetraw(repo, outgoing, bundler, source, fastpath)

842

return packermap[bundler.version][1](util.chunkbuffer(gengroup), None)

841

return packermap[bundler.version][1](util.chunkbuffer(gengroup), None)

843

842

844

def changegroupsubset(repo, roots, heads, source, version='01'):

843

def changegroupsubset(repo, roots, heads, source, version='01'):

845

"""Compute a changegroup consisting of all the nodes that are

844

"""Compute a changegroup consisting of all the nodes that are

846

descendants of any of the roots and ancestors of any of the heads.

845

descendants of any of the roots and ancestors of any of the heads.

847

Return a chunkbuffer object whose read() method will return

846

Return a chunkbuffer object whose read() method will return

848

successive changegroup chunks.

847

successive changegroup chunks.

849

848

850

It is fairly complex as determining which filenodes and which

849

It is fairly complex as determining which filenodes and which

851

manifest nodes need to be included for the changeset to be complete

850

manifest nodes need to be included for the changeset to be complete

852

is non-trivial.

851

is non-trivial.

853

852

854

Another wrinkle is doing the reverse, figuring out which changeset in

853

Another wrinkle is doing the reverse, figuring out which changeset in

855

the changegroup a particular filenode or manifestnode belongs to.

854

the changegroup a particular filenode or manifestnode belongs to.

856

"""

855

"""

857

cl = repo.changelog

856

cl = repo.changelog

858

if not roots:

857

if not roots:

859

roots = [nullid]

858

roots = [nullid]

860

discbases = []

859

discbases = []

861

for n in roots:

860

for n in roots:

862

discbases.extend([p for p in cl.parents(n) if p != nullid])

861

discbases.extend([p for p in cl.parents(n) if p != nullid])

863

# TODO: remove call to nodesbetween.

862

# TODO: remove call to nodesbetween.

864

csets, roots, heads = cl.nodesbetween(roots, heads)

863

csets, roots, heads = cl.nodesbetween(roots, heads)

865

included = set(csets)

864

included = set(csets)

866

discbases = [n for n in discbases if n not in included]

865

discbases = [n for n in discbases if n not in included]

867

outgoing = discovery.outgoing(cl, discbases, heads)

866

outgoing = discovery.outgoing(cl, discbases, heads)

868

bundler = packermap[version][0](repo)

867

bundler = packermap[version][0](repo)

869

return getsubset(repo, outgoing, bundler, source)

868

return getsubset(repo, outgoing, bundler, source)

870

869

871

def getlocalchangegroupraw(repo, source, outgoing, bundlecaps=None,

870

def getlocalchangegroupraw(repo, source, outgoing, bundlecaps=None,

872

version='01'):

871

version='01'):

873

"""Like getbundle, but taking a discovery.outgoing as an argument.

872

"""Like getbundle, but taking a discovery.outgoing as an argument.

874

873

875

This is only implemented for local repos and reuses potentially

874

This is only implemented for local repos and reuses potentially

876

precomputed sets in outgoing. Returns a raw changegroup generator."""

875

precomputed sets in outgoing. Returns a raw changegroup generator."""

877

if not outgoing.missing:

876

if not outgoing.missing:

878

return None

877

return None

879

bundler = packermap[version][0](repo, bundlecaps)

878

bundler = packermap[version][0](repo, bundlecaps)

880

return getsubsetraw(repo, outgoing, bundler, source)

879

return getsubsetraw(repo, outgoing, bundler, source)

881

880

882

def getlocalchangegroup(repo, source, outgoing, bundlecaps=None,

881

def getlocalchangegroup(repo, source, outgoing, bundlecaps=None,

883

version='01'):

882

version='01'):

884

"""Like getbundle, but taking a discovery.outgoing as an argument.

883

"""Like getbundle, but taking a discovery.outgoing as an argument.

885

884

886

This is only implemented for local repos and reuses potentially

885

This is only implemented for local repos and reuses potentially

887

precomputed sets in outgoing."""

886

precomputed sets in outgoing."""

888

if not outgoing.missing:

887

if not outgoing.missing:

889

return None

888

return None

890

bundler = packermap[version][0](repo, bundlecaps)

889

bundler = packermap[version][0](repo, bundlecaps)

891

return getsubset(repo, outgoing, bundler, source)

890

return getsubset(repo, outgoing, bundler, source)

892

891

893

def computeoutgoing(repo, heads, common):

892

def computeoutgoing(repo, heads, common):

894

"""Computes which revs are outgoing given a set of common

893

"""Computes which revs are outgoing given a set of common

895

and a set of heads.

894

and a set of heads.

896

895

897

This is a separate function so extensions can have access to

896

This is a separate function so extensions can have access to

898

the logic.

897

the logic.

899

898

900

Returns a discovery.outgoing object.

899

Returns a discovery.outgoing object.

901

"""

900

"""

902

cl = repo.changelog

901

cl = repo.changelog

903

if common:

902

if common:

904

hasnode = cl.hasnode

903

hasnode = cl.hasnode

905

common = [n for n in common if hasnode(n)]

904

common = [n for n in common if hasnode(n)]

906

else:

905

else:

907

common = [nullid]

906

common = [nullid]

908

if not heads:

907

if not heads:

909

heads = cl.heads()

908

heads = cl.heads()

910

return discovery.outgoing(cl, common, heads)

909

return discovery.outgoing(cl, common, heads)

911

910

912

def getchangegroup(repo, source, heads=None, common=None, bundlecaps=None,

911

def getchangegroup(repo, source, heads=None, common=None, bundlecaps=None,

913

version='01'):

912

version='01'):

914

"""Like changegroupsubset, but returns the set difference between the

913

"""Like changegroupsubset, but returns the set difference between the

915

ancestors of heads and the ancestors common.

914

ancestors of heads and the ancestors common.

916

915

917

If heads is None, use the local heads. If common is None, use [nullid].

916

If heads is None, use the local heads. If common is None, use [nullid].

918

917

919

The nodes in common might not all be known locally due to the way the

918

The nodes in common might not all be known locally due to the way the

920

current discovery protocol works.

919

current discovery protocol works.

921

"""

920

"""

922

outgoing = computeoutgoing(repo, heads, common)

921

outgoing = computeoutgoing(repo, heads, common)

923

return getlocalchangegroup(repo, source, outgoing, bundlecaps=bundlecaps,

922

return getlocalchangegroup(repo, source, outgoing, bundlecaps=bundlecaps,

924

version=version)

923

version=version)

925

924

926

def changegroup(repo, basenodes, source):

925

def changegroup(repo, basenodes, source):

927

# to avoid a race we use changegroupsubset() (issue1320)

926

# to avoid a race we use changegroupsubset() (issue1320)

928

return changegroupsubset(repo, basenodes, repo.heads(), source)

927

return changegroupsubset(repo, basenodes, repo.heads(), source)

929

928

930

def _addchangegroupfiles(repo, source, revmap, trp, pr, needfiles, wasempty):

929

def _addchangegroupfiles(repo, source, revmap, trp, pr, needfiles, wasempty):

931

revisions = 0

930

revisions = 0

932

files = 0

931

files = 0

933

while True:

932

while True:

934

chunkdata = source.filelogheader()

933

chunkdata = source.filelogheader()

935

if not chunkdata:

934

if not chunkdata:

936

break

935

break

937

f = chunkdata["filename"]

936

f = chunkdata["filename"]

938

repo.ui.debug("adding %s revisions\n" % f)

937

repo.ui.debug("adding %s revisions\n" % f)

939

pr()

938

pr()

940

fl = repo.file(f)

939

fl = repo.file(f)

941

o = len(fl)

940

o = len(fl)

942

try:

941

try:

943

if not fl.addgroup(source, revmap, trp):

942

if not fl.addgroup(source, revmap, trp):

944

raise error.Abort(_("received file revlog group is empty"))

943

raise error.Abort(_("received file revlog group is empty"))

945

except error.CensoredBaseError as e:

944

except error.CensoredBaseError as e:

946

raise error.Abort(_("received delta base is censored: %s") % e)

945

raise error.Abort(_("received delta base is censored: %s") % e)

947

revisions += len(fl) - o

946

revisions += len(fl) - o

948

files += 1

947

files += 1

949

if f in needfiles:

948

if f in needfiles:

950

needs = needfiles[f]

949

needs = needfiles[f]

951

for new in xrange(o, len(fl)):

950

for new in xrange(o, len(fl)):

952

n = fl.node(new)

951

n = fl.node(new)

953

if n in needs:

952

if n in needs:

954

needs.remove(n)

953

needs.remove(n)

955

else:

954

else:

956

raise error.Abort(

955

raise error.Abort(

957

_("received spurious file revlog entry"))

956

_("received spurious file revlog entry"))

958

if not needs:

957

if not needs:

959

del needfiles[f]

958

del needfiles[f]

960

repo.ui.progress(_('files'), None)

959

repo.ui.progress(_('files'), None)

961

960

962

for f, needs in needfiles.iteritems():

961

for f, needs in needfiles.iteritems():

963

fl = repo.file(f)

962

fl = repo.file(f)

964

for n in needs:

963

for n in needs:

965

try:

964

try:

966

fl.rev(n)

965

fl.rev(n)

967

except error.LookupError:

966

except error.LookupError:

968

raise error.Abort(

967

raise error.Abort(

969

_('missing file data for %s:%s - run hg verify') %

968

_('missing file data for %s:%s - run hg verify') %

970

(f, hex(n)))

969

(f, hex(n)))

971

970

972

return revisions, files

971

return revisions, files

	Site-wide shortcuts
/	Use quick search box
g h	Goto home page
g g	Goto my private gists page
g G	Goto my public gists page
g 0-9	Goto bookmarked items from 0-9
n r	New repository page
n g	New gist page

	Repositories
g s	Goto summary page
g c	Goto changelog page
g f	Goto files page
g F	Goto files page with file search activated
g p	Goto pull requests page
g o	Goto repository settings
g O	Goto repository access permissions settings
t s	Toggle sidebar on some pages

             # changegroup.py - Mercurial changegroup manipulation functions
             #
             #  Copyright 2006 Matt Mackall <mpm@selenic.com>
             #
             # This software may be used and distributed according to the terms of the
             # GNU General Public License version 2 or any later version.
             from __future__ import absolute_import
             import os
             import struct
             import tempfile
             import weakref
             from .i18n import _
             from .node import (
                 hex,
                 nullid,
                 nullrev,
                 short,
             )
             from . import (
                 branchmap,
                 dagutil,
                 discovery,
                 error,
                 mdiff,
                 phases,
                 util,
             )
             _CHANGEGROUPV1_DELTA_HEADER = "20s20s20s20s"
             _CHANGEGROUPV2_DELTA_HEADER = "20s20s20s20s20s"
             def readexactly(stream, n):
                 '''read n bytes from stream.read and abort if less was available'''
                 s = stream.read(n)
                 if len(s) < n:
                     raise error.Abort(_("stream ended unexpectedly"
                                        " (got %d bytes, expected %d)")
                                       % (len(s), n))
                 return s
             def getchunk(stream):
                 """return the next chunk from stream as a string"""
                 d = readexactly(stream, 4)
                 l = struct.unpack(">l", d)[0]
                 if l <= 4:
                     if l:
                         raise error.Abort(_("invalid chunk length %d") % l)
                     return ""
                 return readexactly(stream, l - 4)
             def chunkheader(length):
                 """return a changegroup chunk header (string)"""
                 return struct.pack(">l", length + 4)
             def closechunk():
                 """return a changegroup chunk header (string) for a zero-length chunk"""
                 return struct.pack(">l", 0)
             def combineresults(results):
                 """logic to combine 0 or more addchangegroup results into one"""
                 changedheads = 0
                 result = 1
                 for ret in results:
                     # If any changegroup result is 0, return 0
                     if ret == 0:
                         result = 0
                         break
                     if ret < -1:
                         changedheads += ret + 1
                     elif ret > 1:
                         changedheads += ret - 1
                 if changedheads > 0:
                     result = 1 + changedheads
                 elif changedheads < 0:
                     result = -1 + changedheads
                 return result
             bundletypes = {
                 "": ("", None),       # only when using unbundle on ssh and old http servers
                                       # since the unification ssh accepts a header but there
                                       # is no capability signaling it.
                 "HG20": (), # special-cased below
                 "HG10UN": ("HG10UN", None),
                 "HG10BZ": ("HG10", 'BZ'),
                 "HG10GZ": ("HG10GZ", 'GZ'),
             }
             # hgweb uses this list to communicate its preferred type
             bundlepriority = ['HG10GZ', 'HG10BZ', 'HG10UN']
             def writechunks(ui, chunks, filename, vfs=None):
                 """Write chunks to a file and return its filename.
                 The stream is assumed to be a bundle file.
                 Existing files will not be overwritten.
                 If no filename is specified, a temporary file is created.
                 """
                 fh = None
                 cleanup = None
                 try:
                     if filename:
                         if vfs:
                             fh = vfs.open(filename, "wb")
                         else:
                             fh = open(filename, "wb")
                     else:
                         fd, filename = tempfile.mkstemp(prefix="hg-bundle-", suffix=".hg")
                         fh = os.fdopen(fd, "wb")
                     cleanup = filename
                     for c in chunks:
                         fh.write(c)
                     cleanup = None
                     return filename
                 finally:
                     if fh is not None:
                         fh.close()
                     if cleanup is not None:
                         if filename and vfs:
                             vfs.unlink(cleanup)
                         else:
                             os.unlink(cleanup)
             def writebundle(ui, cg, filename, bundletype, vfs=None, compression=None):
                 """Write a bundle file and return its filename.
                 Existing files will not be overwritten.
                 If no filename is specified, a temporary file is created.
                 bz2 compression can be turned off.
                 The bundle file will be deleted in case of errors.
                 """
                 if bundletype == "HG20":
                     from . import bundle2
                     bundle = bundle2.bundle20(ui)
                     bundle.setcompression(compression)
                     part = bundle.newpart('changegroup', data=cg.getchunks())
                     part.addparam('version', cg.version)
                     chunkiter = bundle.getchunks()
                 else:
                     # compression argument is only for the bundle2 case
                     assert compression is None
                     if cg.version != '01':
                         raise error.Abort(_('old bundle types only supports v1 '
                                             'changegroups'))
                     header, comp = bundletypes[bundletype]
                     if comp not in util.compressors:
                         raise error.Abort(_('unknown stream compression type: %s')
                                           % comp)
                     z = util.compressors[comp]()
                     subchunkiter = cg.getchunks()
                     def chunkiter():
                         yield header
                         for chunk in subchunkiter:
                             yield z.compress(chunk)
                         yield z.flush()
                     chunkiter = chunkiter()
                 # parse the changegroup data, otherwise we will block
                 # in case of sshrepo because we don't know the end of the stream
                 # an empty chunkgroup is the end of the changegroup
                 # a changegroup has at least 2 chunkgroups (changelog and manifest).
                 # after that, an empty chunkgroup is the end of the changegroup
                 return writechunks(ui, chunkiter, filename, vfs=vfs)
             class cg1unpacker(object):
                 """Unpacker for cg1 changegroup streams.
                 A changegroup unpacker handles the framing of the revision data in
                 the wire format. Most consumers will want to use the apply()
                 method to add the changes from the changegroup to a repository.
                 If you're forwarding a changegroup unmodified to another consumer,
                 use getchunks(), which returns an iterator of changegroup
                 chunks. This is mostly useful for cases where you need to know the
                 data stream has ended by observing the end of the changegroup.
                 deltachunk() is useful only if you're applying delta data. Most
                 consumers should prefer apply() instead.
                 A few other public methods exist. Those are used only for
                 bundlerepo and some debug commands - their use is discouraged.
                 """
                 deltaheader = _CHANGEGROUPV1_DELTA_HEADER
                 deltaheadersize = struct.calcsize(deltaheader)
                 version = '01'
                 def __init__(self, fh, alg):
                     if alg == 'UN':
                         alg = None # get more modern without breaking too much
                     if not alg in util.decompressors:
                         raise error.Abort(_('unknown stream compression type: %s')
                                          % alg)
                     if alg == 'BZ':
                         alg = '_truncatedBZ'
                     self._stream = util.decompressors[alg](fh)
                     self._type = alg
                     self.callback = None
                 # These methods (compressed, read, seek, tell) all appear to only
                 # be used by bundlerepo, but it's a little hard to tell.
                 def compressed(self):
                     return self._type is not None
                 def read(self, l):
                     return self._stream.read(l)
                 def seek(self, pos):
                     return self._stream.seek(pos)
                 def tell(self):
                     return self._stream.tell()
                 def close(self):
                     return self._stream.close()
                 def _chunklength(self):
                     d = readexactly(self._stream, 4)
                     l = struct.unpack(">l", d)[0]
                     if l <= 4:
                         if l:
                             raise error.Abort(_("invalid chunk length %d") % l)
                         return 0
                     if self.callback:
                         self.callback()
                     return l - 4
                 def changelogheader(self):
                     """v10 does not have a changelog header chunk"""
                     return {}
                 def manifestheader(self):
                     """v10 does not have a manifest header chunk"""
                     return {}
                 def filelogheader(self):
                     """return the header of the filelogs chunk, v10 only has the filename"""
                     l = self._chunklength()
                     if not l:
                         return {}
                     fname = readexactly(self._stream, l)
                     return {'filename': fname}
                 def _deltaheader(self, headertuple, prevnode):
                     node, p1, p2, cs = headertuple
                     if prevnode is None:
                         deltabase = p1
                     else:
                         deltabase = prevnode
                     return node, p1, p2, deltabase, cs
                 def deltachunk(self, prevnode):
                     l = self._chunklength()
                     if not l:
                         return {}
                     headerdata = readexactly(self._stream, self.deltaheadersize)
                     header = struct.unpack(self.deltaheader, headerdata)
                     delta = readexactly(self._stream, l - self.deltaheadersize)
                     node, p1, p2, deltabase, cs = self._deltaheader(header, prevnode)
                     return {'node': node, 'p1': p1, 'p2': p2, 'cs': cs,
                             'deltabase': deltabase, 'delta': delta}
                 def getchunks(self):
                     """returns all the chunks contains in the bundle
                     Used when you need to forward the binary stream to a file or another
                     network API. To do so, it parse the changegroup data, otherwise it will
                     block in case of sshrepo because it don't know the end of the stream.
                     """
                     # an empty chunkgroup is the end of the changegroup
                     # a changegroup has at least 2 chunkgroups (changelog and manifest).
                     # after that, an empty chunkgroup is the end of the changegroup
                     empty = False
                     count = 0
                     while not empty or count <= 2:
                         empty = True
                         count += 1
                         while True:
                             chunk = getchunk(self)
                             if not chunk:
                                 break
                             empty = False
                             yield chunkheader(len(chunk))
                             pos = 0
                             while pos < len(chunk):
                                 next = pos + 2**20
                                 yield chunk[pos:next]
                                 pos = next
                         yield closechunk()
                 def _unpackmanifests(self, repo, revmap, trp, prog, numchanges):
                     # We know that we'll never have more manifests than we had
                     # changesets.
                     self.callback = prog(_('manifests'), numchanges)
                     # no need to check for empty manifest group here:
                     # if the result of the merge of 1 and 2 is the same in 3 and 4,
                     # no new manifest will be created and the manifest group will
                     # be empty during the pull
                     self.manifestheader()
                     repo.manifest.addgroup(self, revmap, trp)
                     repo.ui.progress(_('manifests'), None)
                 def apply(self, repo, srctype, url, emptyok=False,
                           targetphase=phases.draft, expectedtotal=None):
                     """Add the changegroup returned by source.read() to this repo.
                     srctype is a string like 'push', 'pull', or 'unbundle'.  url is
                     the URL of the repo where this changegroup is coming from.
                     Return an integer summarizing the change to this repo:
                     - nothing changed or no source: 0
                     - more heads than before: 1+added heads (2..n)
                     - fewer heads than before: -1-removed heads (-2..-n)
                     - number of heads stays the same: 1
                     """
                     repo = repo.unfiltered()
                     wasempty = (len(repo.changelog) == 0)
                     def csmap(x):
                         repo.ui.debug("add changeset %s\n" % short(x))
                         return len(cl)
                     def revmap(x):
                         return cl.rev(x)
                     changesets = files = revisions = 0
                     tr = repo.transaction("\n".join([srctype, util.hidepassword(url)]))
                     try:
                         # The transaction could have been created before and already
                         # carries source information. In this case we use the top
                         # level data. We overwrite the argument because we need to use
                         # the top level value (if they exist) in this function.
                         srctype = tr.hookargs.setdefault('source', srctype)
                         url = tr.hookargs.setdefault('url', url)
                         repo.hook('prechangegroup', throw=True, **tr.hookargs)
                         # write changelog data to temp files so concurrent readers
                         # will not see an inconsistent view
                         cl = repo.changelog
                         cl.delayupdate(tr)
                         oldheads = cl.heads()
                         trp = weakref.proxy(tr)
                         # pull off the changeset group
                         repo.ui.status(_("adding changesets\n"))
                         clstart = len(cl)
                         class prog(object):
                             def __init__(self, step, total):
                                 self._step = step
                                 self._total = total
                                 self._count = 1
                             def __call__(self):
                                 repo.ui.progress(self._step, self._count, unit=_('chunks'),
                                                  total=self._total)
                                 self._count += 1
                         self.callback = prog(_('changesets'), expectedtotal)
                         efiles = set()
                         def onchangelog(cl, node):
                             efiles.update(cl.read(node)[3])
                         self.changelogheader()
                         srccontent = cl.addgroup(self, csmap, trp,
                                                  addrevisioncb=onchangelog)
                         efiles = len(efiles)
                         if not (srccontent or emptyok):
                             raise error.Abort(_("received changelog group is empty"))
                         clend = len(cl)
                         changesets = clend - clstart
                         repo.ui.progress(_('changesets'), None)
                         # pull off the manifest group
                         repo.ui.status(_("adding manifests\n"))
                         self._unpackmanifests(repo, revmap, trp, prog, changesets)
                         needfiles = {}
                         if repo.ui.configbool('server', 'validate', default=False):
                             # validate incoming csets have their manifests
                             for cset in xrange(clstart, clend):
                                 mfnode = repo.changelog.read(repo.changelog.node(cset))[0]
                                 mfest = repo.manifest.readdelta(mfnode)
                                 # store file nodes we must see
                                 for f, n in mfest.iteritems():
                                     needfiles.setdefault(f, set()).add(n)
                         # process the files
                         repo.ui.status(_("adding file changes\n"))
                         self.callback = None
                         pr = prog(_('files'), efiles)
                         newrevs, newfiles = _addchangegroupfiles(
                             repo, self, revmap, trp, pr, needfiles, wasempty)
                         revisions += newrevs
                         files += newfiles
                         dh = 0
                         if oldheads:
                             heads = cl.heads()
                             dh = len(heads) - len(oldheads)
                             for h in heads:
                                 if h not in oldheads and repo[h].closesbranch():
                                     dh -= 1
                         htext = ""
                         if dh:
                             htext = _(" (%+d heads)") % dh
                         repo.ui.status(_("added %d changesets"
                                          " with %d changes to %d files%s\n")
                                          % (changesets, revisions, files, htext))
                         repo.invalidatevolatilesets()
                         if changesets > 0:
                             if 'node' not in tr.hookargs:
                                 tr.hookargs['node'] = hex(cl.node(clstart))
                                 hookargs = dict(tr.hookargs)
                             else:
                                 hookargs = dict(tr.hookargs)
                                 hookargs['node'] = hex(cl.node(clstart))
                             repo.hook('pretxnchangegroup', throw=True, **hookargs)
                         added = [cl.node(r) for r in xrange(clstart, clend)]
                         publishing = repo.publishing()
                         if srctype in ('push', 'serve'):
                             # Old servers can not push the boundary themselves.
                             # New servers won't push the boundary if changeset already
                             # exists locally as secret
                             #
                             # We should not use added here but the list of all change in
                             # the bundle
                             if publishing:
                                 phases.advanceboundary(repo, tr, phases.public, srccontent)
                             else:
                                 # Those changesets have been pushed from the outside, their
                                 # phases are going to be pushed alongside. Therefor
                                 # `targetphase` is ignored.
                                 phases.advanceboundary(repo, tr, phases.draft, srccontent)
                                 phases.retractboundary(repo, tr, phases.draft, added)
                         elif srctype != 'strip':
                             # publishing only alter behavior during push
                             #
                             # strip should not touch boundary at all
                             phases.retractboundary(repo, tr, targetphase, added)
                         if changesets > 0:
                             if srctype != 'strip':
                                 # During strip, branchcache is invalid but coming call to
                                 # `destroyed` will repair it.
                                 # In other case we can safely update cache on disk.
                                 branchmap.updatecache(repo.filtered('served'))
                             def runhooks():
                                 # These hooks run when the lock releases, not when the
                                 # transaction closes. So it's possible for the changelog
                                 # to have changed since we last saw it.
                                 if clstart >= len(repo):
                                     return
                                 # forcefully update the on-disk branch cache
                                 repo.ui.debug("updating the branch cache\n")
                                 repo.hook("changegroup", **hookargs)
                                 for n in added:
                                     args = hookargs.copy()
                                     args['node'] = hex(n)
                                     repo.hook("incoming", **args)
                                 newheads = [h for h in repo.heads() if h not in oldheads]
                                 repo.ui.log("incoming",
                                             "%s incoming changes - new heads: %s\n",
                                             len(added),
                                             ', '.join([hex(c[:6]) for c in newheads]))
                             tr.addpostclose('changegroup-runhooks-%020i' % clstart,
                                             lambda tr: repo._afterlock(runhooks))
                         tr.close()
                     finally:
                         tr.release()
                         repo.ui.flush()
                     # never return 0 here:
                     if dh < 0:
                         return dh - 1
                     else:
                         return dh + 1
             class cg2unpacker(cg1unpacker):
                 """Unpacker for cg2 streams.
                 cg2 streams add support for generaldelta, so the delta header
                 format is slightly different. All other features about the data
                 remain the same.
                 """
                 deltaheader = _CHANGEGROUPV2_DELTA_HEADER
                 deltaheadersize = struct.calcsize(deltaheader)
                 version = '02'
                 def _deltaheader(self, headertuple, prevnode):
                     node, p1, p2, deltabase, cs = headertuple
                     return node, p1, p2, deltabase, cs
             class headerlessfixup(object):
                 def __init__(self, fh, h):
                     self._h = h
                     self._fh = fh
                 def read(self, n):
                     if self._h:
                         d, self._h = self._h[:n], self._h[n:]
                         if len(d) < n:
                             d += readexactly(self._fh, n - len(d))
                         return d
                     return readexactly(self._fh, n)
             class cg1packer(object):
                 deltaheader = _CHANGEGROUPV1_DELTA_HEADER
                 version = '01'
                 def __init__(self, repo, bundlecaps=None):
                     """Given a source repo, construct a bundler.
                     bundlecaps is optional and can be used to specify the set of
                     capabilities which can be used to build the bundle.
                     """
                     # Set of capabilities we can use to build the bundle.
                     if bundlecaps is None:
                         bundlecaps = set()
                     self._bundlecaps = bundlecaps
                     # experimental config: bundle.reorder
                     reorder = repo.ui.config('bundle', 'reorder', 'auto')
                     if reorder == 'auto':
                         reorder = None
                     else:
                         reorder = util.parsebool(reorder)
                     self._repo = repo
                     self._reorder = reorder
                     self._progress = repo.ui.progress
                     if self._repo.ui.verbose and not self._repo.ui.debugflag:
                         self._verbosenote = self._repo.ui.note
                     else:
                         self._verbosenote = lambda s: None
                 def close(self):
                     return closechunk()
                 def fileheader(self, fname):
                     return chunkheader(len(fname)) + fname
                 def group(self, nodelist, revlog, lookup, units=None):
                     """Calculate a delta group, yielding a sequence of changegroup chunks
                     (strings).
                     Given a list of changeset revs, return a set of deltas and
                     metadata corresponding to nodes. The first delta is
                     first parent(nodelist[0]) -> nodelist[0], the receiver is
                     guaranteed to have this parent as it has all history before
                     these changesets. In the case firstparent is nullrev the
                     changegroup starts with a full revision.
                     If units is not None, progress detail will be generated, units specifies
                     the type of revlog that is touched (changelog, manifest, etc.).
                     """
                     # if we don't have any revisions touched by these changesets, bail
                     if len(nodelist) == 0:
                         yield self.close()
                         return
                     # for generaldelta revlogs, we linearize the revs; this will both be
                     # much quicker and generate a much smaller bundle
                     if (revlog._generaldelta and self._reorder is None) or self._reorder:
                         dag = dagutil.revlogdag(revlog)
                         revs = set(revlog.rev(n) for n in nodelist)
                         revs = dag.linearize(revs)
                     else:
                         revs = sorted([revlog.rev(n) for n in nodelist])
                     # add the parent of the first rev
                     p = revlog.parentrevs(revs[0])[0]
                     revs.insert(0, p)
                     # build deltas
                     total = len(revs) - 1
                     msgbundling = _('bundling')
                     for r in xrange(len(revs) - 1):
                         if units is not None:
                             self._progress(msgbundling, r + 1, unit=units, total=total)
                         prev, curr = revs[r], revs[r + 1]
                         linknode = lookup(revlog.node(curr))
                         for c in self.revchunk(revlog, curr, prev, linknode):
                             yield c
                     if units is not None:
                         self._progress(msgbundling, None)
                     yield self.close()
                 # filter any nodes that claim to be part of the known set
                 def prune(self, revlog, missing, commonrevs):
                     rr, rl = revlog.rev, revlog.linkrev
                     return [n for n in missing if rl(rr(n)) not in commonrevs]
                 def _packmanifests(self, mfnodes, lookuplinknode):
                     """Pack flat manifests into a changegroup stream."""
                     ml = self._repo.manifest
                     size = 0
                     for chunk in self.group(
                             mfnodes, ml, lookuplinknode, units=_('manifests')):
                         size += len(chunk)
                         yield chunk
                     self._verbosenote(_('%8.i (manifests)\n') % size)
                 def generate(self, commonrevs, clnodes, fastpathlinkrev, source):
                     '''yield a sequence of changegroup chunks (strings)'''
                     repo = self._repo
                     cl = repo.changelog
                     ml = repo.manifest
                     clrevorder = {}
                     mfs = {} # needed manifests
                     fnodes = {} # needed file nodes
                     # maps manifest node id -> set(changed files)
                     mfchangedfiles = {}
                     # Callback for the changelog, used to collect changed files and manifest
                     # nodes.
                     # Returns the linkrev node (identity in the changelog case).
                     def lookupcl(x):
                         c = cl.read(x)
                         clrevorder[x] = len(clrevorder)
                         n = c[0]
                         # record the first changeset introducing this manifest version
                         mfs.setdefault(n, x)
                         # Record a complete list of potentially-changed files in
                         # this manifest.
                         mfchangedfiles.setdefault(n, set()).update(c[3])
                         return x
                     self._verbosenote(_('uncompressed size of bundle content:\n'))
                     size = 0
                     for chunk in self.group(clnodes, cl, lookupcl, units=_('changesets')):
                         size += len(chunk)
                         yield chunk
                     self._verbosenote(_('%8.i (changelog)\n') % size)
                     # We need to make sure that the linkrev in the changegroup refers to
                     # the first changeset that introduced the manifest or file revision.
                     # The fastpath is usually safer than the slowpath, because the filelogs
                     # are walked in revlog order.
                     #
                     # When taking the slowpath with reorder=None and the manifest revlog
                     # uses generaldelta, the manifest may be walked in the "wrong" order.
                     # Without 'clrevorder', we would get an incorrect linkrev (see fix in
                     # cc0ff93d0c0c).
                     #
                     # When taking the fastpath, we are only vulnerable to reordering
                     # of the changelog itself. The changelog never uses generaldelta, so
                     # it is only reordered when reorder=True. To handle this case, we
                     # simply take the slowpath, which already has the 'clrevorder' logic.
                     # This was also fixed in cc0ff93d0c0c.
                     fastpathlinkrev = fastpathlinkrev and not self._reorder
                     # Callback for the manifest, used to collect linkrevs for filelog
                     # revisions.
                     # Returns the linkrev node (collected in lookupcl).
                     def lookupmflinknode(x):
                         """Callback for looking up the linknode for manifests.
                         Returns the linkrev node for the specified manifest.
                         SIDE EFFECT:
                           fclnodes gets populated with the list of relevant
                           file nodes if we're not using fastpathlinkrev.
                         Note that this means you can't trust fclnodes until
                         after manifests have been sent to the client.
                         """
                         clnode = mfs[x]
                         if not fastpathlinkrev:
                             mdata = ml.readfast(x)
                             for f in mfchangedfiles[x]:
-                                if True:
+                                try:
-                                    try:
+                                    n = mdata[f]
-                                        n = mdata[f]
+                                except KeyError:
-                                    except KeyError:
+                                    continue
-                                        continue
+                                # record the first changeset introducing this filelog
-                                    # record the first changeset introducing this filelog
+                                # version
-                                    # version
+                                fclnodes = fnodes.setdefault(f, {})
-                                    fclnodes = fnodes.setdefault(f, {})
+                                fclnode = fclnodes.setdefault(n, clnode)
-                                    fclnode = fclnodes.setdefault(n, clnode)
+                                if clrevorder[clnode] < clrevorder[fclnode]:
-                                    if clrevorder[clnode] < clrevorder[fclnode]:
+                                    fclnodes[n] = clnode
-                                        fclnodes[n] = clnode
                         return clnode
                     mfnodes = self.prune(ml, mfs, commonrevs)
                     for x in self._packmanifests(mfnodes, lookupmflinknode):
                         yield x
                     mfs.clear()
                     clrevs = set(cl.rev(x) for x in clnodes)
                     def linknodes(filerevlog, fname):
                         if fastpathlinkrev:
                             llr = filerevlog.linkrev
                             def genfilenodes():
                                 for r in filerevlog:
                                     linkrev = llr(r)
                                     if linkrev in clrevs:
                                         yield filerevlog.node(r), cl.node(linkrev)
                             return dict(genfilenodes())
                         return fnodes.get(fname, {})
                     changedfiles = set()
                     for x in mfchangedfiles.itervalues():
                         changedfiles.update(x)
                     for chunk in self.generatefiles(changedfiles, linknodes, commonrevs,
                                                     source):
                         yield chunk
                     yield self.close()
                     if clnodes:
                         repo.hook('outgoing', node=hex(clnodes[0]), source=source)
                 # The 'source' parameter is useful for extensions
                 def generatefiles(self, changedfiles, linknodes, commonrevs, source):
                     repo = self._repo
                     progress = self._progress
                     msgbundling = _('bundling')
                     total = len(changedfiles)
                     # for progress output
                     msgfiles = _('files')
                     for i, fname in enumerate(sorted(changedfiles)):
                         filerevlog = repo.file(fname)
                         if not filerevlog:
                             raise error.Abort(_("empty or missing revlog for %s") % fname)
                         linkrevnodes = linknodes(filerevlog, fname)
                         # Lookup for filenodes, we collected the linkrev nodes above in the
                         # fastpath case and with lookupmf in the slowpath case.
                         def lookupfilelog(x):
                             return linkrevnodes[x]
                         filenodes = self.prune(filerevlog, linkrevnodes, commonrevs)
                         if filenodes:
                             progress(msgbundling, i + 1, item=fname, unit=msgfiles,
                                      total=total)
                             h = self.fileheader(fname)
                             size = len(h)
                             yield h
                             for chunk in self.group(filenodes, filerevlog, lookupfilelog):
                                 size += len(chunk)
                                 yield chunk
                             self._verbosenote(_('%8.i  %s\n') % (size, fname))
                     progress(msgbundling, None)
                 def deltaparent(self, revlog, rev, p1, p2, prev):
                     return prev
                 def revchunk(self, revlog, rev, prev, linknode):
                     node = revlog.node(rev)
                     p1, p2 = revlog.parentrevs(rev)
                     base = self.deltaparent(revlog, rev, p1, p2, prev)
                     prefix = ''
                     if revlog.iscensored(base) or revlog.iscensored(rev):
                         try:
                             delta = revlog.revision(node)
                         except error.CensoredNodeError as e:
                             delta = e.tombstone
                         if base == nullrev:
                             prefix = mdiff.trivialdiffheader(len(delta))
                         else:
                             baselen = revlog.rawsize(base)
                             prefix = mdiff.replacediffheader(baselen, len(delta))
                     elif base == nullrev:
                         delta = revlog.revision(node)
                         prefix = mdiff.trivialdiffheader(len(delta))
                     else:
                         delta = revlog.revdiff(base, rev)
                     p1n, p2n = revlog.parents(node)
                     basenode = revlog.node(base)
                     meta = self.builddeltaheader(node, p1n, p2n, basenode, linknode)
                     meta += prefix
                     l = len(meta) + len(delta)
                     yield chunkheader(l)
                     yield meta
                     yield delta
                 def builddeltaheader(self, node, p1n, p2n, basenode, linknode):
                     # do nothing with basenode, it is implicitly the previous one in HG10
                     return struct.pack(self.deltaheader, node, p1n, p2n, linknode)
             class cg2packer(cg1packer):
                 version = '02'
                 deltaheader = _CHANGEGROUPV2_DELTA_HEADER
                 def __init__(self, repo, bundlecaps=None):
                     super(cg2packer, self).__init__(repo, bundlecaps)
                     if self._reorder is None:
                         # Since generaldelta is directly supported by cg2, reordering
                         # generally doesn't help, so we disable it by default (treating
                         # bundle.reorder=auto just like bundle.reorder=False).
                         self._reorder = False
                 def deltaparent(self, revlog, rev, p1, p2, prev):
                     dp = revlog.deltaparent(rev)
                     # avoid storing full revisions; pick prev in those cases
                     # also pick prev when we can't be sure remote has dp
                     if dp == nullrev or (dp != p1 and dp != p2 and dp != prev):
                         return prev
                     return dp
                 def builddeltaheader(self, node, p1n, p2n, basenode, linknode):
                     return struct.pack(self.deltaheader, node, p1n, p2n, basenode, linknode)
             packermap = {'01': (cg1packer, cg1unpacker),
                          # cg2 adds support for exchanging generaldelta
                          '02': (cg2packer, cg2unpacker),
             }
             def _changegroupinfo(repo, nodes, source):
                 if repo.ui.verbose or source == 'bundle':
                     repo.ui.status(_("%d changesets found\n") % len(nodes))
                 if repo.ui.debugflag:
                     repo.ui.debug("list of changesets:\n")
                     for node in nodes:
                         repo.ui.debug("%s\n" % hex(node))
             def getsubsetraw(repo, outgoing, bundler, source, fastpath=False):
                 repo = repo.unfiltered()
                 commonrevs = outgoing.common
                 csets = outgoing.missing
                 heads = outgoing.missingheads
                 # We go through the fast path if we get told to, or if all (unfiltered
                 # heads have been requested (since we then know there all linkrevs will
                 # be pulled by the client).
                 heads.sort()
                 fastpathlinkrev = fastpath or (
                         repo.filtername is None and heads == sorted(repo.heads()))
                 repo.hook('preoutgoing', throw=True, source=source)
                 _changegroupinfo(repo, csets, source)
                 return bundler.generate(commonrevs, csets, fastpathlinkrev, source)
             def getsubset(repo, outgoing, bundler, source, fastpath=False):
                 gengroup = getsubsetraw(repo, outgoing, bundler, source, fastpath)
                 return packermap[bundler.version][1](util.chunkbuffer(gengroup), None)
             def changegroupsubset(repo, roots, heads, source, version='01'):
                 """Compute a changegroup consisting of all the nodes that are
                 descendants of any of the roots and ancestors of any of the heads.
                 Return a chunkbuffer object whose read() method will return
                 successive changegroup chunks.
                 It is fairly complex as determining which filenodes and which
                 manifest nodes need to be included for the changeset to be complete
                 is non-trivial.
                 Another wrinkle is doing the reverse, figuring out which changeset in
                 the changegroup a particular filenode or manifestnode belongs to.
                 """
                 cl = repo.changelog
                 if not roots:
                     roots = [nullid]
                 discbases = []
                 for n in roots:
                     discbases.extend([p for p in cl.parents(n) if p != nullid])
                 # TODO: remove call to nodesbetween.
                 csets, roots, heads = cl.nodesbetween(roots, heads)
                 included = set(csets)
                 discbases = [n for n in discbases if n not in included]
                 outgoing = discovery.outgoing(cl, discbases, heads)
                 bundler = packermap[version][0](repo)
                 return getsubset(repo, outgoing, bundler, source)
             def getlocalchangegroupraw(repo, source, outgoing, bundlecaps=None,
                                        version='01'):
                 """Like getbundle, but taking a discovery.outgoing as an argument.
                 This is only implemented for local repos and reuses potentially
                 precomputed sets in outgoing. Returns a raw changegroup generator."""
                 if not outgoing.missing:
                     return None
                 bundler = packermap[version][0](repo, bundlecaps)
                 return getsubsetraw(repo, outgoing, bundler, source)
             def getlocalchangegroup(repo, source, outgoing, bundlecaps=None,
                                     version='01'):
                 """Like getbundle, but taking a discovery.outgoing as an argument.
                 This is only implemented for local repos and reuses potentially
                 precomputed sets in outgoing."""
                 if not outgoing.missing:
                     return None
                 bundler = packermap[version][0](repo, bundlecaps)
                 return getsubset(repo, outgoing, bundler, source)
             def computeoutgoing(repo, heads, common):
                 """Computes which revs are outgoing given a set of common
                 and a set of heads.
                 This is a separate function so extensions can have access to
                 the logic.
                 Returns a discovery.outgoing object.
                 """
                 cl = repo.changelog
                 if common:
                     hasnode = cl.hasnode
                     common = [n for n in common if hasnode(n)]
                 else:
                     common = [nullid]
                 if not heads:
                     heads = cl.heads()
                 return discovery.outgoing(cl, common, heads)
             def getchangegroup(repo, source, heads=None, common=None, bundlecaps=None,
                                version='01'):
                 """Like changegroupsubset, but returns the set difference between the
                 ancestors of heads and the ancestors common.
                 If heads is None, use the local heads. If common is None, use [nullid].
                 The nodes in common might not all be known locally due to the way the
                 current discovery protocol works.
                 """
                 outgoing = computeoutgoing(repo, heads, common)
                 return getlocalchangegroup(repo, source, outgoing, bundlecaps=bundlecaps,
                                            version=version)
             def changegroup(repo, basenodes, source):
                 # to avoid a race we use changegroupsubset() (issue1320)
                 return changegroupsubset(repo, basenodes, repo.heads(), source)
             def _addchangegroupfiles(repo, source, revmap, trp, pr, needfiles, wasempty):
                 revisions = 0
                 files = 0
                 while True:
                     chunkdata = source.filelogheader()
                     if not chunkdata:
                         break
                     f = chunkdata["filename"]
                     repo.ui.debug("adding %s revisions\n" % f)
                     pr()
                     fl = repo.file(f)
                     o = len(fl)
                     try:
                         if not fl.addgroup(source, revmap, trp):
                             raise error.Abort(_("received file revlog group is empty"))
                     except error.CensoredBaseError as e:
                         raise error.Abort(_("received delta base is censored: %s") % e)
                     revisions += len(fl) - o
                     files += 1
                     if f in needfiles:
                         needs = needfiles[f]
                         for new in xrange(o, len(fl)):
                             n = fl.node(new)
                             if n in needs:
                                 needs.remove(n)
                             else:
                                 raise error.Abort(
                                     _("received spurious file revlog entry"))
                         if not needs:
                             del needfiles[f]
                 repo.ui.progress(_('files'), None)
                 for f, needs in needfiles.iteritems():
                     fl = repo.file(f)
                     for n in needs:
                         try:
                             fl.rev(n)
                         except error.LookupError:
                             raise error.Abort(
                                 _('missing file data for %s:%s - run hg verify') %
                                 (f, hex(n)))
                 return revisions, files