upstream/mercurial-mirror Commit - r24898:0bbf0615

1

# changegroup.py - Mercurial changegroup manipulation functions

1

# changegroup.py - Mercurial changegroup manipulation functions

2

#

2

#

3

4

#

4

#

5

# This software may be used and distributed according to the terms of the

5

# This software may be used and distributed according to the terms of the

6

# GNU General Public License version 2 or any later version.

6

# GNU General Public License version 2 or any later version.

7

8

import weakref

8

import weakref

9

from i18n import _

9

from i18n import _

10

from node import nullrev, nullid, hex, short

10

from node import nullrev, nullid, hex, short

11

import mdiff, util, dagutil

11

import mdiff, util, dagutil

12

import struct, os, bz2, zlib, tempfile

12

import struct, os, bz2, zlib, tempfile

13

import discovery, error, phases, branchmap

13

import discovery, error, phases, branchmap

14

15

# struct formats of the delta header that precedes every delta: a run of
# 20-byte fields. The unpackers in this file read the v1 fields as
# (node, p1, p2, cs) and the v2 fields as (node, p1, p2, deltabase, cs).
_CHANGEGROUPV1_DELTA_HEADER = "20s20s20s20s"
_CHANGEGROUPV2_DELTA_HEADER = "20s20s20s20s20s"

17

18

def readexactly(stream, n):
    '''read exactly n bytes from stream.read and abort on a short read

    Returns the data read. Raises util.Abort when stream.read(n) hands back
    fewer than n bytes.
    '''
    data = stream.read(n)
    got = len(data)
    if got >= n:
        return data
    raise util.Abort(_("stream ended unexpectedly"
                       " (got %d bytes, expected %d)")
                     % (got, n))

26

27

def getchunk(stream):
    """return the payload of the next chunk read from stream, as a string

    A chunk starts with a 4-byte big-endian signed length that includes the
    four bytes of the length field itself. A length of 0 denotes an empty
    chunk, for which "" is returned; any other length up to 4 is rejected
    with util.Abort.
    """
    (length,) = struct.unpack(">l", readexactly(stream, 4))
    if length == 0:
        return ""
    if length <= 4:
        raise util.Abort(_("invalid chunk length %d") % length)
    return readexactly(stream, length - 4)

36

37

def chunkheader(length):
    """return the header (string) of a changegroup chunk holding length bytes

    The header is a big-endian signed 32-bit integer whose value also counts
    the four bytes of the header itself.
    """
    headersize = 4
    return struct.pack(">l", headersize + length)

40

41

def closechunk():
    """return the changegroup chunk header (string) of a zero-length chunk"""
    emptylength = 0
    return struct.pack(">l", emptylength)

44

45

def combineresults(results):
    """logic to combine 0 or more addchangegroup results into one

    results is an iterable of integers. A result of 0 wins outright: the
    combined value is 0 as soon as one is met. Otherwise every result above
    1 contributes (ret - 1) and every result below -1 contributes (ret + 1)
    to a running head delta. The combined value is 1 + delta when the delta
    is positive, -1 + delta when it is negative, and 1 when it is zero
    (which includes an empty results).
    """
    changedheads = 0
    for ret in results:
        # If any changegroup result is 0, return 0. Returning right here
        # (instead of merely leaving the loop) keeps the head delta gathered
        # from earlier results from overriding that 0 further down.
        if ret == 0:
            return 0
        if ret < -1:
            changedheads += ret + 1
        elif ret > 1:
            changedheads += ret - 1
    if changedheads > 0:
        return 1 + changedheads
    if changedheads < 0:
        return -1 + changedheads
    return 1

63

64

class nocompress(object):
    """pass-through object offering the compress()/flush() pair

    Lets code that drives a compressor object handle the uncompressed case
    the same way: data goes through untouched and nothing is buffered.
    """

    def compress(self, x):
        # hand the data back unchanged
        return x

    def flush(self):
        # nothing was held back, so there is nothing left to emit
        return ""

69

70

# Maps a bundle type name to a (header, compressor factory) pair: the header
# is written first into the bundle file and the factory is called without
# arguments to obtain an object with compress() and flush() methods.
bundletypes = {
    # The empty type is only used with unbundle on ssh and old http servers:
    # since the unification ssh accepts a header but there is no capability
    # signaling it.
    "": ("", nocompress),
    "HG20": (), # special-cased below
    "HG10UN": ("HG10UN", nocompress),
    "HG10BZ": ("HG10", lambda: bz2.BZ2Compressor()),
    "HG10GZ": ("HG10GZ", lambda: zlib.compressobj()),
}

# hgweb uses this list to communicate its preferred type
bundlepriority = ['HG10GZ', 'HG10BZ', 'HG10UN']

82

83

def writebundle(ui, cg, filename, bundletype, vfs=None):
    """Write the changegroup cg to a bundle file and return its filename.

    If no filename is specified, a temporary file (prefix "hg-bundle-",
    suffix ".hg") is created; otherwise filename is opened for writing,
    through vfs when one is given.
    bundletype selects the container: "HG20" wraps cg into a bundle2 that is
    written without compression; any other key of bundletypes writes that
    type's header followed by the chunks of cg run through that type's
    compressor, and requires cg.version to be '01'.
    The bundle file will be deleted in case of errors.

    NOTE(review): the target is opened in "wb" mode, so nothing here appears
    to protect an already existing file from being overwritten - confirm.
    """
    out = None
    # path to delete in the finally clause; reset to None once the bundle
    # has been written completely
    cleanup = None
    try:
        if not filename:
            fd, filename = tempfile.mkstemp(prefix="hg-bundle-", suffix=".hg")
            out = os.fdopen(fd, "wb")
        elif vfs:
            out = vfs.open(filename, "wb")
        else:
            out = open(filename, "wb")
        cleanup = filename

        if bundletype != "HG20":
            if cg.version != '01':
                raise util.Abort(_('old bundle types only supports v1 '
                                   'changegroups'))
            header, makecompressor = bundletypes[bundletype]
            out.write(header)
            engine = makecompressor()
            chunks = cg.getchunks()
        else:
            import bundle2
            bundler = bundle2.bundle20(ui)
            part = bundler.newpart('changegroup', data=cg.getchunks())
            part.addparam('version', cg.version)
            engine = nocompress()
            chunks = bundler.getchunks()

        # stream every chunk through the compressor into the file, then
        # write out whatever the compressor still holds
        for chunk in chunks:
            out.write(engine.compress(chunk))
        out.write(engine.flush())
        cleanup = None
        return filename
    finally:
        if out is not None:
            out.close()
        if cleanup is not None:
            if filename and vfs:
                vfs.unlink(cleanup)
            else:
                os.unlink(cleanup)

140

141

def decompressor(fh, alg):
    """return a stream giving access to the decompressed content of fh

    alg is the two-letter compression identifier:
    - 'UN': fh itself is returned,
    - 'GZ': fh is read through util.filechunkiter and inflated with zlib,
    - 'BZ': fh is read in 4096-byte pieces and decompressed with bz2.
    For 'GZ' and 'BZ' the decompressed pieces are wrapped in a
    util.chunkbuffer. Any other identifier raises util.Abort.
    """
    if alg == 'UN':
        return fh
    elif alg == 'GZ':
        def generator(f):
            zd = zlib.decompressobj()
            for chunk in util.filechunkiter(f):
                yield zd.decompress(chunk)
    elif alg == 'BZ':
        def generator(f):
            zd = bz2.BZ2Decompressor()
            # Prime the decompressor with the "BZ" magic before feeding it
            # the file content. NOTE(review): presumably those two bytes
            # were already consumed from fh as the tail of the "HG10BZ"
            # bundle header - confirm against the caller.
            zd.decompress("BZ")
            for chunk in util.filechunkiter(f, 4096):
                yield zd.decompress(chunk)
    else:
        # wrapped in _() like every other abort message in this file
        raise util.Abort(_("unknown bundle compression '%s'") % alg)
    return util.chunkbuffer(generator(fh))

158

159

class cg1unpacker(object):
    """unpacker for version '01' changegroup streams

    Wraps the stream returned by decompressor(fh, alg) and offers raw stream
    access (read/seek/tell/close) next to chunk-level readers.
    """
    deltaheader = _CHANGEGROUPV1_DELTA_HEADER
    deltaheadersize = struct.calcsize(deltaheader)
    version = '01'

    def __init__(self, fh, alg):
        self._stream = decompressor(fh, alg)
        # compression identifier, kept to answer compressed()
        self._type = alg
        # optional callable, invoked by chunklength() for each non-empty
        # chunk
        self.callback = None

    def compressed(self):
        """tell whether the compression identifier is anything but 'UN'"""
        return self._type != 'UN'

    # the four methods below simply delegate to the underlying stream

    def read(self, l):
        return self._stream.read(l)

    def seek(self, pos):
        return self._stream.seek(pos)

    def tell(self):
        return self._stream.tell()

    def close(self):
        return self._stream.close()

    def chunklength(self):
        """read a chunk header and return the length of the chunk payload

        Returns 0 for an empty chunk and aborts on any other length up to 4.
        self.callback, when set, is called for every non-empty chunk.
        """
        (length,) = struct.unpack(">l", readexactly(self._stream, 4))
        if length == 0:
            return 0
        if length <= 4:
            raise util.Abort(_("invalid chunk length %d") % length)
        if self.callback:
            self.callback()
        return length - 4

    def changelogheader(self):
        """v10 does not have a changelog header chunk"""
        return {}

    def manifestheader(self):
        """v10 does not have a manifest header chunk"""
        return {}

    def filelogheader(self):
        """return the header of the filelogs chunk, v10 only has the filename"""
        namelength = self.chunklength()
        if namelength:
            return {'filename': readexactly(self._stream, namelength)}
        return {}

    def _deltaheader(self, headertuple, prevnode):
        node, p1, p2, cs = headertuple
        # the v1 header names no delta base: it is the previously read node,
        # or p1 when no previous node is given
        deltabase = prevnode
        if prevnode is None:
            deltabase = p1
        return node, p1, p2, deltabase, cs

    def deltachunk(self, prevnode):
        """read the next delta chunk and return it as a dict

        Returns {} when the chunk is empty. Otherwise the dict has the keys
        'node', 'p1', 'p2', 'cs', 'deltabase' and 'delta'.
        """
        chunksize = self.chunklength()
        if not chunksize:
            return {}
        rawheader = readexactly(self._stream, self.deltaheadersize)
        fields = struct.unpack(self.deltaheader, rawheader)
        delta = readexactly(self._stream, chunksize - self.deltaheadersize)
        node, p1, p2, deltabase, cs = self._deltaheader(fields, prevnode)
        return {'node': node, 'p1': p1, 'p2': p2, 'cs': cs,
                'deltabase': deltabase, 'delta': delta}

    def getchunks(self):
        """return all the chunks contained in the bundle

        Used when you need to forward the binary stream to a file or another
        network API. To do so, it parses the changegroup data, otherwise it
        would block in case of sshrepo because it does not know the end of
        the stream.
        """
        # an empty chunkgroup is the end of the changegroup
        # a changegroup has at least 2 chunkgroups (changelog and manifest).
        # after that, an empty chunkgroup is the end of the changegroup
        piecesize = 2 ** 20
        groupcount = 0
        lastempty = False
        while groupcount <= 2 or not lastempty:
            lastempty = True
            groupcount += 1
            chunk = getchunk(self)
            while chunk:
                lastempty = False
                yield chunkheader(len(chunk))
                # hand the payload over in pieces of at most piecesize bytes
                start = 0
                while start < len(chunk):
                    end = start + piecesize
                    yield chunk[start:end]
                    start = end
                chunk = getchunk(self)
            yield closechunk()

251

252

class cg2unpacker(cg1unpacker):
    """unpacker for version '02' changegroup streams

    Same as cg1unpacker except for the delta header, which has a fifth
    field naming the delta base.
    """
    deltaheader = _CHANGEGROUPV2_DELTA_HEADER
    deltaheadersize = struct.calcsize(deltaheader)
    version = '02'

    def _deltaheader(self, headertuple, prevnode):
        # the delta base comes straight from the header, so prevnode is not
        # consulted here
        node, p1, p2, deltabase, cs = headertuple
        return node, p1, p2, deltabase, cs

260

261

class headerlessfixup(object):
    """reader serving the bytes of h first, then the content of fh

    read(n) returns exactly n bytes: what is left of h is used up before fh
    is read, and the part taken from fh goes through readexactly().
    """

    def __init__(self, fh, h):
        self._h = h
        self._fh = fh

    def read(self, n):
        if not self._h:
            return readexactly(self._fh, n)
        data, self._h = self._h[:n], self._h[n:]
        missing = n - len(data)
        if missing > 0:
            # h ran out before n bytes were gathered: top up from fh
            data += readexactly(self._fh, missing)
        return data

272

273

class cg1packer(object):

273

class cg1packer(object):

274

deltaheader = _CHANGEGROUPV1_DELTA_HEADER

274

deltaheader = _CHANGEGROUPV1_DELTA_HEADER

275

version = '01'

275

version = '01'

276

def __init__(self, repo, bundlecaps=None):
    """Given a source repo, construct a bundler.

    bundlecaps is optional and can be used to specify the set of
    capabilities which can be used to build the bundle.
    """
    # Set of capabilities we can use to build the bundle.
    if bundlecaps is None:
        bundlecaps = set()
    self._bundlecaps = bundlecaps
    self._changelog = repo.changelog
    self._manifest = repo.manifest

    # bundle.reorder defaults to 'auto', stored as None; any other value
    # goes through util.parsebool
    ui = repo.ui
    reorder = ui.config('bundle', 'reorder', 'auto')
    if reorder == 'auto':
        reorder = None
    else:
        reorder = util.parsebool(reorder)
    self._repo = repo
    self._reorder = reorder
    self._progress = ui.progress

    # size notes are only printed in verbose mode without the debug flag
    if ui.verbose and not ui.debugflag:
        self._verbosenote = ui.note
    else:
        self._verbosenote = lambda s: None

300

301

def close(self):
    """return the chunk emitted at the end of a group: a zero-length chunk"""
    endofgroup = closechunk()
    return endofgroup

303

304

def fileheader(self, fname):
    """return the chunk announcing fname: a chunk header, then the name"""
    header = chunkheader(len(fname))
    return header + fname

306

307

def group(self, nodelist, revlog, lookup, units=None, reorder=None):
    """Calculate a delta group, yielding a sequence of changegroup chunks
    (strings).

    Given a list of changeset revs, return a set of deltas and
    metadata corresponding to nodes. The first delta is
    first parent(nodelist[0]) -> nodelist[0], the receiver is
    guaranteed to have this parent as it has all history before
    these changesets. In the case firstparent is nullrev the
    changegroup starts with a full revision.

    lookup is called with each node and returns the linknode stored in
    that node's delta header.

    If units is not None, progress detail will be generated, units specifies
    the type of revlog that is touched (changelog, manifest, etc.).
    """
    # if we don't have any revisions touched by these changesets, bail
    if len(nodelist) == 0:
        yield self.close()
        return

    # for generaldelta revlogs, we linearize the revs; this will both be
    # much quicker and generate a much smaller bundle
    torev = revlog.rev
    if (revlog._generaldelta and reorder is not False) or reorder:
        dag = dagutil.revlogdag(revlog)
        revs = dag.linearize(set(torev(n) for n in nodelist))
    else:
        revs = sorted([torev(n) for n in nodelist])

    # add the parent of the first rev
    firstparent = revlog.parentrevs(revs[0])[0]
    revs.insert(0, firstparent)

    # build deltas: each rev is sent along with the rev that precedes it
    # in the list
    total = len(revs) - 1
    msgbundling = _('bundling')
    for pos in xrange(total):
        if units is not None:
            self._progress(msgbundling, pos + 1, unit=units, total=total)
        prev, curr = revs[pos], revs[pos + 1]
        linknode = lookup(revlog.node(curr))
        for c in self.revchunk(revlog, curr, prev, linknode):
            yield c

    yield self.close()

351

352

# filter any nodes that claim to be part of the known set

352

# filter any nodes that claim to be part of the known set

353

def prune(self, revlog, missing, commonrevs):
    """return the list of nodes of missing whose linkrev is not in commonrevs

    The linkrev of a node is obtained as revlog.linkrev(revlog.rev(node)).
    """
    torev, tolinkrev = revlog.rev, revlog.linkrev
    kept = []
    for n in missing:
        if tolinkrev(torev(n)) not in commonrevs:
            kept.append(n)
    return kept

356

357

def generate(self, commonrevs, clnodes, fastpathlinkrev, source):
    '''yield a sequence of changegroup chunks (strings)

    The chunks come in this order: the changelog group for clnodes, the
    manifest group, whatever generatefiles() yields for the changed files,
    and a final closing chunk. Manifest nodes whose linkrev is in
    commonrevs are left out (see prune()).

    When fastpathlinkrev is true and no reordering is requested, the
    linknodes of a file are computed from the linkrevs stored in its
    filelog; otherwise they are collected while the manifest group is
    generated.
    source is handed to generatefiles() and to the 'outgoing' hook, which is
    run once everything has been yielded and only if clnodes is not empty.
    '''
    repo = self._repo
    cl = self._changelog
    mf = self._manifest
    reorder = self._reorder
    progress = self._progress

    # for progress output
    msgbundling = _('bundling')

    clrevorder = {}
    mfs = {} # needed manifests
    fnodes = {} # needed file nodes
    changedfiles = set()

    # Callback for the changelog, used to collect changed files and manifest
    # nodes.
    # Returns the linkrev node (identity in the changelog case).
    def lookupcl(x):
        c = cl.read(x)
        # position of x in the order the changesets are sent
        clrevorder[x] = len(clrevorder)
        changedfiles.update(c[3])
        # record the first changeset introducing this manifest version
        mfs.setdefault(c[0], x)
        return x

    self._verbosenote(_('uncompressed size of bundle content:\n'))
    clsize = 0
    for chunk in self.group(clnodes, cl, lookupcl, units=_('changesets'),
                            reorder=reorder):
        clsize += len(chunk)
        yield chunk
    self._verbosenote(_('%8.i (changelog)\n') % clsize)
    progress(msgbundling, None)

    # Callback for the manifest, used to collect linkrevs for filelog
    # revisions.
    # Returns the linkrev node (collected in lookupcl).
    def lookupmf(x):
        clnode = mfs[x]
        if fastpathlinkrev and not reorder:
            return clnode
        for f, n in mf.readfast(x).iteritems():
            if f not in changedfiles:
                continue
            # record the first changeset introducing this filelog
            # version
            fclnodes = fnodes.setdefault(f, {})
            fclnode = fclnodes.setdefault(n, clnode)
            if clrevorder[clnode] < clrevorder[fclnode]:
                fclnodes[n] = clnode
        return clnode

    mfnodes = self.prune(mf, mfs, commonrevs)
    mfsize = 0
    for chunk in self.group(mfnodes, mf, lookupmf, units=_('manifests'),
                            reorder=reorder):
        mfsize += len(chunk)
        yield chunk
    self._verbosenote(_('%8.i (manifests)\n') % mfsize)
    progress(msgbundling, None)

    mfs.clear()
    clrevs = set(cl.rev(x) for x in clnodes)

    # Returns a dict mapping the file nodes of fname to their linknode.
    def linknodes(filerevlog, fname):
        if not fastpathlinkrev or reorder:
            return fnodes.get(fname, {})
        llr = filerevlog.linkrev
        def genfilenodes():
            for r in filerevlog:
                linkrev = llr(r)
                if linkrev in clrevs:
                    yield filerevlog.node(r), cl.node(linkrev)
        return dict(genfilenodes())

    for chunk in self.generatefiles(changedfiles, linknodes, commonrevs,
                                    source):
        yield chunk

    yield self.close()
    progress(msgbundling, None)

    if clnodes:
        repo.hook('outgoing', node=hex(clnodes[0]), source=source)

442

443

# The 'source' parameter is useful for extensions

443

# The 'source' parameter is useful for extensions

444

def generatefiles(self, changedfiles, linknodes, commonrevs, source):
    """yield the changegroup chunks of every file in changedfiles

    Files are handled in sorted name order. For each of them,
    linknodes(filerevlog, fname) gives a mapping from file node to linknode;
    nodes whose linkrev is in commonrevs are dropped (see prune()) and, if
    any node is left, a file header followed by the file's delta group is
    yielded. Raises util.Abort for a file whose revlog is empty or missing.
    source is not used here.
    """
    repo = self._repo
    progress = self._progress
    reorder = self._reorder
    msgbundling = _('bundling')

    # for progress output
    total = len(changedfiles)
    msgfiles = _('files')
    for i, fname in enumerate(sorted(changedfiles)):
        filerevlog = repo.file(fname)
        if not filerevlog:
            raise util.Abort(_("empty or missing revlog for %s") % fname)

        linkrevnodes = linknodes(filerevlog, fname)
        # Lookup for filenodes, we collected the linkrev nodes above in the
        # fastpath case and with lookupmf in the slowpath case.
        def lookupfilelog(x):
            return linkrevnodes[x]

        filenodes = self.prune(filerevlog, linkrevnodes, commonrevs)
        if not filenodes:
            continue
        progress(msgbundling, i + 1, item=fname, unit=msgfiles,
                 total=total)
        header = self.fileheader(fname)
        size = len(header)
        yield header
        for chunk in self.group(filenodes, filerevlog, lookupfilelog,
                                reorder=reorder):
            size += len(chunk)
            yield chunk
        self._verbosenote(_('%8.i %s\n') % (size, fname))

476

477

def deltaparent(self, revlog, rev, p1, p2, prev):
    """return the rev that the delta for rev is computed against

    This implementation always answers prev; the other arguments are not
    looked at.
    """
    base = prev
    return base

479

480

def revchunk(self, revlog, rev, prev, linknode):

480

def revchunk(self, revlog, rev, prev, linknode):

481

node = revlog.node(rev)

481

node = revlog.node(rev)

482

p1, p2 = revlog.parentrevs(rev)

482

p1, p2 = revlog.parentrevs(rev)

483

base = self.deltaparent(revlog, rev, p1, p2, prev)

483

base = self.deltaparent(revlog, rev, p1, p2, prev)

484

485

prefix = ''

485

prefix = ''

486

if revlog.iscensored(base) or revlog.iscensored(rev):

486

if revlog.iscensored(base) or revlog.iscensored(rev):

487

try:

487

try:

488

delta = revlog.revision(node)

488

delta = revlog.revision(node)

489

except error.CensoredNodeError, e:

489

except error.CensoredNodeError, e:

490

delta = e.tombstone

490

delta = e.tombstone

491

if base == nullrev:

491

if base == nullrev:

492

prefix = mdiff.trivialdiffheader(len(delta))

492

prefix = mdiff.trivialdiffheader(len(delta))

493

else:

493

else:

494

baselen = revlog.rawsize(base)

494

baselen = revlog.rawsize(base)

495

prefix = mdiff.replacediffheader(baselen, len(delta))

495

prefix = mdiff.replacediffheader(baselen, len(delta))

496

elif base == nullrev:

496

elif base == nullrev:

497

delta = revlog.revision(node)

497

delta = revlog.revision(node)

498

prefix = mdiff.trivialdiffheader(len(delta))

498

prefix = mdiff.trivialdiffheader(len(delta))

499

else:

499

else:

500

delta = revlog.revdiff(base, rev)

500

delta = revlog.revdiff(base, rev)

501

p1n, p2n = revlog.parents(node)

501

p1n, p2n = revlog.parents(node)

502

basenode = revlog.node(base)

502

basenode = revlog.node(base)

503

meta = self.builddeltaheader(node, p1n, p2n, basenode, linknode)

503

meta = self.builddeltaheader(node, p1n, p2n, basenode, linknode)

504

meta += prefix

504

meta += prefix

505

l = len(meta) + len(delta)

505

l = len(meta) + len(delta)

506

yield chunkheader(l)

506

yield chunkheader(l)

507

yield meta

507

yield meta

508

yield delta

508

yield delta

509

def builddeltaheader(self, node, p1n, p2n, basenode, linknode):
    """Pack the per-revision delta header using self.deltaheader.

    Only node, p1n, p2n and linknode are packed, in that order.
    """
    # do nothing with basenode, it is implicitly the previous one in HG10
    fields = (node, p1n, p2n, linknode)
    return struct.pack(self.deltaheader, *fields)

512

513

class cg2packer(cg1packer):
    """Packer for version '02' changegroups.

    Differs from the parent packer in three ways visible here: the delta
    header also carries the base node, the delta base may be something
    other than the previous revision, and reordering is switched off for
    generaldelta revlogs unless explicitly requested.
    """
    version = '02'
    deltaheader = _CHANGEGROUPV2_DELTA_HEADER

    def group(self, nodelist, revlog, lookup, units=None, reorder=None):
        """Delegate to the parent group(), adjusting the reorder default.

        For a generaldelta revlog, any reorder value other than the
        literal True is replaced by False.
        """
        keeporder = revlog._generaldelta and reorder is not True
        if keeporder:
            reorder = False
        parent = super(cg2packer, self)
        return parent.group(nodelist, revlog, lookup, units=units,
                            reorder=reorder)

    def deltaparent(self, revlog, rev, p1, p2, prev):
        """Choose the delta base for rev.

        The revlog's own delta parent is used when it is one of p1, p2
        or prev; in every other case prev is returned.
        """
        stored = revlog.deltaparent(rev)
        # a null delta parent would mean sending a full revision, and a
        # base other than p1/p2/prev may be unknown to the remote: use
        # prev for both
        if stored != nullrev and stored in (p1, p2, prev):
            return stored
        return prev

    def builddeltaheader(self, node, p1n, p2n, basenode, linknode):
        """Pack the delta header, including the explicit base node."""
        fields = (node, p1n, p2n, basenode, linknode)
        return struct.pack(self.deltaheader, *fields)

533

534

# changegroup version string -> (packer class, unpacker class)
packermap = {
    '01': (cg1packer, cg1unpacker),
    '02': (cg2packer, cg2unpacker),
}

536

537

def _changegroupinfo(repo, nodes, source):
    """Report the changesets about to be bundled through the repo's ui.

    The count is printed when the ui is verbose or source is 'bundle';
    the hex form of every node is printed in debug mode.
    """
    ui = repo.ui
    if ui.verbose or source == 'bundle':
        ui.status(_("%d changesets found\n") % len(nodes))
    if not ui.debugflag:
        return
    ui.debug("list of changesets:\n")
    for n in nodes:
        ui.debug("%s\n" % hex(n))

544

545

def getsubsetraw(repo, outgoing, bundler, source, fastpath=False):
    """Return what bundler.generate() produces for the outgoing changesets.

    repo is switched to its unfiltered view. outgoing supplies the common
    and missing sets plus the missing heads. source is handed to the
    'preoutgoing' hook (which may abort, throw=True) and to generate().
    fastpath forces the linkrev fast path; it is also taken automatically
    when every head of the unfiltered repo is being requested.
    """
    repo = repo.unfiltered()
    commonrevs = outgoing.common
    csets = outgoing.missing
    # Work on a sorted copy: sorting outgoing.missingheads in place would
    # silently reorder a list owned by the caller's outgoing object.
    heads = sorted(outgoing.missingheads)
    # We go through the fast path if we get told to, or if all (unfiltered)
    # heads have been requested (since we then know that all linkrevs will
    # be pulled by the client).
    fastpathlinkrev = fastpath or (
        repo.filtername is None and heads == sorted(repo.heads()))

    repo.hook('preoutgoing', throw=True, source=source)
    _changegroupinfo(repo, csets, source)
    return bundler.generate(commonrevs, csets, fastpathlinkrev, source)

560

561

def getsubset(repo, outgoing, bundler, source, fastpath=False, version='01'):
    """Like getsubsetraw(), but wrap the result in an unpacker object.

    The raw output is buffered with util.chunkbuffer and handed, together
    with the 'UN' marker, to the unpacker class registered for version.
    """
    rawchunks = getsubsetraw(repo, outgoing, bundler, source, fastpath)
    unpackercls = packermap[version][1]
    return unpackercls(util.chunkbuffer(rawchunks), 'UN')

564

565

def changegroupsubset(repo, roots, heads, source, version='01'):
    """Compute a changegroup consisting of all the nodes that are
    descendants of any of the roots and ancestors of any of the heads.
    Return a chunkbuffer object whose read() method will return
    successive changegroup chunks.

    It is fairly complex as determining which filenodes and which
    manifest nodes need to be included for the changeset to be complete
    is non-trivial.

    Another wrinkle is doing the reverse, figuring out which changeset in
    the changegroup a particular filenode or manifestnode belongs to.

    An empty roots argument is treated as [nullid].
    """
    cl = repo.changelog
    roots = roots or [nullid]
    # TODO: remove call to nodesbetween.
    _missing, roots, heads = cl.nodesbetween(roots, heads)
    # the discovery bases are the non-null parents of the computed roots
    discbases = [p for n in roots for p in cl.parents(n) if p != nullid]
    outgoing = discovery.outgoing(cl, discbases, heads)
    packercls = packermap[version][0]
    bundler = packercls(repo)
    return getsubset(repo, outgoing, bundler, source, version=version)

589

590

def getlocalchangegroupraw(repo, source, outgoing, bundlecaps=None,
                           version='01'):
    """Like getbundle, but taking a discovery.outgoing as an argument.

    This is only implemented for local repos and reuses potentially
    precomputed sets in outgoing. Returns a raw changegroup generator,
    or None when outgoing.missing is empty."""
    if outgoing.missing:
        packercls = packermap[version][0]
        bundler = packercls(repo, bundlecaps)
        return getsubsetraw(repo, outgoing, bundler, source)
    return None

600

601

def getlocalchangegroup(repo, source, outgoing, bundlecaps=None):
    """Like getbundle, but taking a discovery.outgoing as an argument.

    This is only implemented for local repos and reuses potentially
    precomputed sets in outgoing. A cg1packer is always used. Returns
    None when outgoing.missing is empty."""
    if outgoing.missing:
        bundler = cg1packer(repo, bundlecaps)
        return getsubset(repo, outgoing, bundler, source)
    return None

610

611

def _computeoutgoing(repo, heads, common):
    """Computes which revs are outgoing given a set of common
    and a set of heads.

    This is a separate function so extensions can have access to
    the logic.

    Nodes in common that the changelog does not know are dropped; an
    empty common becomes [nullid] and empty heads become the changelog
    heads.

    Returns a discovery.outgoing object.
    """
    cl = repo.changelog
    if not common:
        common = [nullid]
    else:
        known = []
        for n in common:
            if cl.hasnode(n):
                known.append(n)
        common = known
    heads = heads or cl.heads()
    return discovery.outgoing(cl, common, heads)

629

630

def getchangegroupraw(repo, source, heads=None, common=None, bundlecaps=None,
                      version='01'):
    """Like changegroupsubset, but returns the set difference between the
    ancestors of heads and the ancestors common.

    If heads is None, use the local heads. If common is None, use [nullid].

    If version is None, use a version '01' changegroup.

    The nodes in common might not all be known locally due to the way the
    current discovery protocol works. Returns a raw changegroup generator.
    """
    if version is None:
        # honour the documented contract: without this, None would be used
        # as a packermap key downstream, where only version strings exist
        version = '01'
    outgoing = _computeoutgoing(repo, heads, common)
    return getlocalchangegroupraw(repo, source, outgoing,
                                  bundlecaps=bundlecaps, version=version)

645

646

def getchangegroup(repo, source, heads=None, common=None, bundlecaps=None):
    """Like changegroupsubset, but returns the set difference between the
    ancestors of heads and the ancestors common.

    If heads is None, use the local heads. If common is None, use [nullid].

    The nodes in common might not all be known locally due to the way the
    current discovery protocol works.
    """
    # filter/default the inputs first, then build the changegroup from the
    # resulting outgoing object
    missing = _computeoutgoing(repo, heads, common)
    return getlocalchangegroup(repo, source, missing, bundlecaps=bundlecaps)

657

658

def changegroup(repo, basenodes, source):
    """Build a changegroup from basenodes up to the current repo heads."""
    # to avoid a race we use changegroupsubset() (issue1320)
    allheads = repo.heads()
    return changegroupsubset(repo, basenodes, allheads, source)

661

662

def addchangegroupfiles(repo, source, revmap, trp, pr, needfiles):

662

def addchangegroupfiles(repo, source, revmap, trp, pr, needfiles):

663

revisions = 0

663

revisions = 0

664

files = 0

664

files = 0

665

while True:

665

while True:

666

chunkdata = source.filelogheader()

666

chunkdata = source.filelogheader()

667

if not chunkdata:

667

if not chunkdata:

668

break

668

break

669

f = chunkdata["filename"]

669

f = chunkdata["filename"]

670

repo.ui.debug("adding %s revisions\n" % f)

670

repo.ui.debug("adding %s revisions\n" % f)

671

pr()

671

pr()

672

fl = repo.file(f)

672

fl = repo.file(f)

673

o = len(fl)

673

o = len(fl)

674

try:

674

try:

675

if not fl.addgroup(source, revmap, trp):

675

if not fl.addgroup(source, revmap, trp):

676

raise util.Abort(_("received file revlog group is empty"))

676

raise util.Abort(_("received file revlog group is empty"))

677

except error.CensoredBaseError, e:

677

except error.CensoredBaseError, e:

678

raise util.Abort(_("received delta base is censored: %s") % e)

678

raise util.Abort(_("received delta base is censored: %s") % e)

679

revisions += len(fl) - o

679

revisions += len(fl) - o

680

files += 1

680

files += 1

681

if f in needfiles:

681

if f in needfiles:

682

needs = needfiles[f]

682

needs = needfiles[f]

683

for new in xrange(o, len(fl)):

683

for new in xrange(o, len(fl)):

684

n = fl.node(new)

684

n = fl.node(new)

685

if n in needs:

685

if n in needs:

686

needs.remove(n)

686

needs.remove(n)

687

else:

687

else:

688

raise util.Abort(

688

raise util.Abort(

689

_("received spurious file revlog entry"))

689

_("received spurious file revlog entry"))

690

if not needs:

690

if not needs:

691

del needfiles[f]

691

del needfiles[f]

692

repo.ui.progress(_('files'), None)

692

repo.ui.progress(_('files'), None)

693

694

for f, needs in needfiles.iteritems():

694

for f, needs in needfiles.iteritems():

695

fl = repo.file(f)

695

fl = repo.file(f)

696

for n in needs:

696

for n in needs:

697

try:

697

try:

698

fl.rev(n)

698

fl.rev(n)

699

except error.LookupError:

699

except error.LookupError:

700

raise util.Abort(

700

raise util.Abort(

701

_('missing file data for %s:%s - run hg verify') %

701

_('missing file data for %s:%s - run hg verify') %

702

(f, hex(n)))

702

(f, hex(n)))

703

704

return revisions, files

704

return revisions, files

705

706

def addchangegroup(repo, source, srctype, url, emptyok=False,
                   targetphase=phases.draft):
    """Add the changegroup returned by source.read() to this repo.
    srctype is a string like 'push', 'pull', or 'unbundle'. url is
    the URL of the repo where this changegroup is coming from.

    An empty changelog group aborts unless emptyok is set.

    Return an integer summarizing the change to this repo:
    - no source: 0
    - more heads than before: 1+added heads (2..n)
    - fewer heads than before: -1-removed heads (-2..-n)
    - number of heads stays the same: 1
    New heads that close a branch are not counted as added.
    """
    repo = repo.unfiltered()
    ui = repo.ui

    def csmap(node):
        ui.debug("add changeset %s\n" % short(node))
        return len(cl)

    def revmap(node):
        return cl.rev(node)

    if not source:
        return 0

    changesets = 0
    touched = set()

    tr = repo.transaction("\n".join([srctype, util.hidepassword(url)]))
    # The transaction could have been created before and already carries
    # source information. In this case the top level data wins, so the
    # arguments are overwritten with whatever the transaction holds.
    srctype = tr.hookargs.setdefault('source', srctype)
    url = tr.hookargs.setdefault('url', url)

    # write changelog data to temp files so concurrent readers will not see
    # inconsistent view
    cl = repo.changelog
    cl.delayupdate(tr)
    oldheads = cl.heads()
    try:
        repo.hook('prechangegroup', throw=True, **tr.hookargs)

        trp = weakref.proxy(tr)

        # pull off the changeset group
        ui.status(_("adding changesets\n"))
        clstart = len(cl)

        class prog(object):
            # progress callback; step/count/total are reset by the code
            # below when moving from changesets to manifests to files
            step = _('changesets')
            count = 1
            ui = repo.ui
            total = None

            def __call__(self):
                self.ui.progress(self.step, self.count, unit=_('chunks'),
                                 total=self.total)
                self.count += 1
        pr = prog()
        source.callback = pr

        source.changelogheader()
        srccontent = cl.addgroup(source, csmap, trp)
        if not srccontent and not emptyok:
            raise util.Abort(_("received changelog group is empty"))
        clend = len(cl)
        changesets = clend - clstart
        for rev in xrange(clstart, clend):
            touched.update(repo[rev].files())
        efiles = len(touched)
        ui.progress(_('changesets'), None)

        # pull off the manifest group
        ui.status(_("adding manifests\n"))
        pr.step = _('manifests')
        pr.count = 1
        pr.total = changesets # manifests <= changesets
        # no need to check for empty manifest group here:
        # if the result of the merge of 1 and 2 is the same in 3 and 4,
        # no new manifest will be created and the manifest group will
        # be empty during the pull
        source.manifestheader()
        repo.manifest.addgroup(source, revmap, trp)
        ui.progress(_('manifests'), None)

        needfiles = {}
        if ui.configbool('server', 'validate', default=False):
            # validate incoming csets have their manifests
            for rev in xrange(clstart, clend):
                mfnode = repo.changelog.read(repo.changelog.node(rev))[0]
                mfdelta = repo.manifest.readdelta(mfnode)
                # store file nodes we must see
                for fname, fnode in mfdelta.iteritems():
                    needfiles.setdefault(fname, set()).add(fnode)

        # process the files
        ui.status(_("adding file changes\n"))
        pr.step = _('files')
        pr.count = 1
        pr.total = efiles
        source.callback = None

        revisions, files = addchangegroupfiles(repo, source, revmap, trp,
                                               pr, needfiles)

        # head count delta, ignoring new heads that close a branch
        dh = 0
        if oldheads:
            heads = cl.heads()
            dh = len(heads) - len(oldheads)
            for h in heads:
                if h in oldheads:
                    continue
                if repo[h].closesbranch():
                    dh -= 1
        htext = ""
        if dh:
            htext = _(" (%+d heads)") % dh

        ui.status(_("added %d changesets"
                    " with %d changes to %d files%s\n")
                  % (changesets, revisions, files, htext))
        repo.invalidatevolatilesets()

        if changesets > 0:
            def pending():
                return tr.writepending() and repo.root or ""
            # the first added changeset is advertised as 'node', but a
            # 'node' already recorded on the transaction is left untouched
            firstnode = hex(cl.node(clstart))
            tr.hookargs.setdefault('node', firstnode)
            hookargs = dict(tr.hookargs)
            hookargs['node'] = firstnode
            repo.hook('pretxnchangegroup', throw=True, pending=pending,
                      **hookargs)

        added = [cl.node(r) for r in xrange(clstart, clend)]
        publishing = ui.configbool('phases', 'publish', True)
        if srctype in ('push', 'serve'):
            # Old servers can not push the boundary themselves.
            # New servers won't push the boundary if changeset already
            # exists locally as secret
            #
            # We should not use added here but the list of all change in
            # the bundle
            if publishing:
                phases.advanceboundary(repo, tr, phases.public, srccontent)
            else:
                # Those changesets have been pushed from the outside, their
                # phases are going to be pushed alongside. Therefore
                # `targetphase` is ignored.
                phases.advanceboundary(repo, tr, phases.draft, srccontent)
                phases.retractboundary(repo, tr, phases.draft, added)
        elif srctype != 'strip':
            # publishing only alter behavior during push
            #
            # strip should not touch boundary at all
            phases.retractboundary(repo, tr, targetphase, added)

        if changesets > 0:
            if srctype != 'strip':
                # During strip, branchcache is invalid but coming call to
                # `destroyed` will repair it.
                # In other case we can safely update cache on disk.
                branchmap.updatecache(repo.filtered('served'))

            def runhooks():
                # These hooks run when the lock releases, not when the
                # transaction closes. So it's possible for the changelog
                # to have changed since we last saw it.
                if clstart >= len(repo):
                    return

                # only the debug message mentions the branch cache; the
                # code here just fires the hooks and logs the result
                ui.debug("updating the branch cache\n")
                repo.hook("changegroup", **hookargs)

                for node in added:
                    nodeargs = hookargs.copy()
                    nodeargs['node'] = hex(node)
                    repo.hook("incoming", **nodeargs)

                newheads = [h for h in repo.heads() if h not in oldheads]
                shortheads = ', '.join([hex(h[:6]) for h in newheads])
                ui.log("incoming",
                       "%s incoming changes - new heads: %s\n",
                       len(added),
                       shortheads)

            tr.addpostclose('changegroup-runhooks-%020i' % clstart,
                            lambda tr: repo._afterlock(runhooks))

        tr.close()

    finally:
        tr.release()
        ui.flush()
    # never return 0 here:
    if dh < 0:
        return dh - 1
    return dh + 1

	Site-wide shortcuts
/	Use quick search box
g h	Goto home page
g g	Goto my private gists page
g G	Goto my public gists page
g 0-9	Goto bookmarked items from 0-9
n r	New repository page
n g	New gist page

	Repositories
g s	Goto summary page
g c	Goto changelog page
g f	Goto files page
g F	Goto files page with file search activated
g p	Goto pull requests page
g o	Goto repository settings
g O	Goto repository access permissions settings
t s	Toggle sidebar on some pages

             # changegroup.py - Mercurial changegroup manipulation functions
             #
             #  Copyright 2006 Matt Mackall <mpm@selenic.com>
             #
             # This software may be used and distributed according to the terms of the
             # GNU General Public License version 2 or any later version.
             import weakref
             from i18n import _
             from node import nullrev, nullid, hex, short
             import mdiff, util, dagutil
             import struct, os, bz2, zlib, tempfile
             import discovery, error, phases, branchmap
             # struct format of a version '01' delta header: four 20-byte fields
             # (cg1packer.builddeltaheader packs node, p1, p2, linknode).
             _CHANGEGROUPV1_DELTA_HEADER = "20s20s20s20s"
             # struct format of a version '02' delta header: five 20-byte fields
             # (cg2packer.builddeltaheader packs node, p1, p2, basenode, linknode).
             _CHANGEGROUPV2_DELTA_HEADER = "20s20s20s20s20s"
             def readexactly(stream, n):
                 """Read exactly n bytes from stream.

                 Returns whatever stream.read(n) produced when it is at least n
                 bytes long; raises util.Abort when the stream delivered less.
                 """
                 data = stream.read(n)
                 got = len(data)
                 if got >= n:
                     return data
                 raise util.Abort(_("stream ended unexpectedly"
                                    " (got %d bytes, expected %d)")
                                  % (got, n))
             def getchunk(stream):
                 """Return the payload of the next chunk read from stream.

                 A chunk starts with a 4-byte big-endian signed length that counts
                 the length field itself. A length of 0 marks an empty chunk and
                 yields ""; any other length of 4 or less aborts.
                 """
                 (length,) = struct.unpack(">l", readexactly(stream, 4))
                 if length > 4:
                     return readexactly(stream, length - 4)
                 if length != 0:
                     raise util.Abort(_("invalid chunk length %d") % length)
                 return ""
             def chunkheader(length):
                 """Build the 4-byte header for a chunk carrying length payload bytes.

                 The encoded value includes the 4 bytes of the header itself.
                 """
                 total = length + 4
                 return struct.pack(">l", total)
             def closechunk():
                 """Build the header of a zero-length chunk.

                 The result is a 4-byte big-endian encoding of 0.
                 """
                 terminator = struct.pack(">l", 0)
                 return terminator
             def combineresults(results):
                 """Combine 0 or more addchangegroup results into one.

                 Each result is an integer: 0, or 1 + n / -1 - n where n is a
                 number of changed heads (so 1 and -1 both carry no head change).

                 Returns 0 as soon as any individual result is 0. Otherwise the
                 head changes of all results are summed and re-encoded the same
                 way: 1 + total when positive, -1 + total when negative, and 1
                 when they cancel out or when results is empty.
                 """
                 changedheads = 0
                 for ret in results:
                     # If any changegroup result is 0, return 0. Returning right
                     # away keeps head changes accumulated from earlier results
                     # from overriding the zero.
                     if ret == 0:
                         return 0
                     if ret < -1:
                         changedheads += ret + 1
                     elif ret > 1:
                         changedheads += ret - 1
                 if changedheads > 0:
                     return 1 + changedheads
                 if changedheads < 0:
                     return -1 + changedheads
                 return 1
             class nocompress(object):
                 """Pass-through object exposing compress() and flush().

                 compress() hands its input back untouched and flush() has nothing
                 left to emit.
                 """
                 def compress(self, x):
                     """Return x unchanged."""
                     return x
                 def flush(self):
                     """Return an empty string."""
                     return ""
             # Maps a bundle type name to a (header, compressor factory) pair.
             # writebundle() writes the header to the file and then calls the
             # factory to obtain an object with compress() and flush() methods.
             bundletypes = {
                 "": ("", nocompress), # only when using unbundle on ssh and old http servers
                                       # since the unification ssh accepts a header but there
                                       # is no capability signaling it.
                 "HG20": (), # special-cased below
                 "HG10UN": ("HG10UN", nocompress),
                 # NOTE(review): the header written here is only "HG10";
                 # presumably the bz2 stream itself supplies the following "BZ"
                 # bytes (decompressor() feeds "BZ" back in when reading) -- confirm.
                 "HG10BZ": ("HG10", lambda: bz2.BZ2Compressor()),
                 "HG10GZ": ("HG10GZ", lambda: zlib.compressobj()),
             }
             # hgweb uses this list to communicate its preferred type
             bundlepriority = ['HG10GZ', 'HG10BZ', 'HG10UN']
             def writebundle(ui, cg, filename, bundletype, vfs=None):
                 """Write a bundle file and return its filename.

                 ui is only passed on to bundle2.bundle20() for "HG20" bundles.
                 cg must provide getchunks() and a version attribute.
                 filename is the destination; if it is empty, a temporary file is
                 created with tempfile.mkstemp() and its name is returned.
                 bundletype is "HG20" or a key of bundletypes; the non-"HG20"
                 types abort unless cg.version is '01'.
                 vfs, when given together with a filename, is used to open (and, on
                 failure, unlink) the file instead of the builtin open/os.unlink.

                 NOTE(review): the destination is opened in "wb" mode, so the
                 historical claim that existing files are not overwritten does not
                 appear to hold for this function on its own -- confirm with callers.

                 The bundle file will be deleted in case of errors.
                 """
                 fh = None
                 # name of the file to remove in the finally clause; reset to None
                 # once everything has been written successfully
                 cleanup = None
                 try:
                     if filename:
                         if vfs:
                             fh = vfs.open(filename, "wb")
                         else:
                             fh = open(filename, "wb")
                     else:
                         fd, filename = tempfile.mkstemp(prefix="hg-bundle-", suffix=".hg")
                         fh = os.fdopen(fd, "wb")
                     # from here on a failure must remove the (partial) file
                     cleanup = filename
                     if bundletype == "HG20":
                         import bundle2
                         # wrap the changegroup in a single 'changegroup' part; the
                         # chunks produced by the bundle are written as they are
                         bundle = bundle2.bundle20(ui)
                         part = bundle.newpart('changegroup', data=cg.getchunks())
                         part.addparam('version', cg.version)
                         z = nocompress()
                         chunkiter = bundle.getchunks()
                     else:
                         if cg.version != '01':
                             raise util.Abort(_('old bundle types only supports v1 '
                                                'changegroups'))
                         header, compressor = bundletypes[bundletype]
                         fh.write(header)
                         z = compressor()
                         chunkiter = cg.getchunks()
                     # parse the changegroup data, otherwise we will block
                     # in case of sshrepo because we don't know the end of the stream
                     # an empty chunkgroup is the end of the changegroup
                     # a changegroup has at least 2 chunkgroups (changelog and manifest).
                     # after that, an empty chunkgroup is the end of the changegroup
                     for chunk in chunkiter:
                         fh.write(z.compress(chunk))
                     fh.write(z.flush())
                     # success: keep the file
                     cleanup = None
                     return filename
                 finally:
                     if fh is not None:
                         fh.close()
                     if cleanup is not None:
                         if filename and vfs:
                             vfs.unlink(cleanup)
                         else:
                             os.unlink(cleanup)
             def decompressor(fh, alg):
                 """Return a readable object yielding the decompressed content of fh.

                 alg selects the compression: 'UN' returns fh itself, 'GZ' and 'BZ'
                 wrap a decompressing generator in util.chunkbuffer. Any other
                 value aborts.
                 """
                 if alg == 'UN':
                     return fh
                 if alg == 'GZ':
                     def inflate(f):
                         zd = zlib.decompressobj()
                         for piece in util.filechunkiter(f):
                             yield zd.decompress(piece)
                 elif alg == 'BZ':
                     def inflate(f):
                         zd = bz2.BZ2Decompressor()
                         # feed the "BZ" bytes to the decompressor before the
                         # content read from f
                         zd.decompress("BZ")
                         for piece in util.filechunkiter(f, 4096):
                             yield zd.decompress(piece)
                 else:
                     raise util.Abort("unknown bundle compression '%s'" % alg)
                 return util.chunkbuffer(inflate(fh))
             class cg1unpacker(object):
                 """Reader for a version '01' changegroup stream.

                 Wraps the (possibly compressed) file object fh and exposes helpers
                 to read chunk lengths, headers and delta chunks from it. If the
                 callback attribute is set, it is invoked for every non-empty chunk
                 length that is read.
                 """
                 deltaheader = _CHANGEGROUPV1_DELTA_HEADER
                 deltaheadersize = struct.calcsize(deltaheader)
                 version = '01'
                 def __init__(self, fh, alg):
                     self._stream = decompressor(fh, alg)
                     self.callback = None
                     self._type = alg
                 def compressed(self):
                     """Tell whether the underlying stream uses a compression."""
                     return not self._type == 'UN'
                 def read(self, l):
                     """Read l bytes from the decompressed stream."""
                     stream = self._stream
                     return stream.read(l)
                 def seek(self, pos):
                     """Delegate to the seek() of the decompressed stream."""
                     stream = self._stream
                     return stream.seek(pos)
                 def tell(self):
                     """Delegate to the tell() of the decompressed stream."""
                     stream = self._stream
                     return stream.tell()
                 def close(self):
                     """Delegate to the close() of the decompressed stream."""
                     stream = self._stream
                     return stream.close()
                 def chunklength(self):
                     """Read a chunk header and return the payload length.

                     Returns 0 for an empty chunk and aborts on any other encoded
                     length of 4 or less. The callback, if any, only runs for
                     chunks that carry a payload.
                     """
                     (length,) = struct.unpack(">l", readexactly(self._stream, 4))
                     if length > 4:
                         if self.callback:
                             self.callback()
                         return length - 4
                     if length:
                         raise util.Abort(_("invalid chunk length %d") % length)
                     return 0
                 def changelogheader(self):
                     """v10 does not have a changelog header chunk"""
                     return {}
                 def manifestheader(self):
                     """v10 does not have a manifest header chunk"""
                     return {}
                 def filelogheader(self):
                     """Return the filelog header; v10 only carries the filename.

                     An empty dict is returned when the chunk is empty.
                     """
                     namelen = self.chunklength()
                     if namelen:
                         return {'filename': readexactly(self._stream, namelen)}
                     return {}
                 def _deltaheader(self, headertuple, prevnode):
                     """Expand an unpacked header into (node, p1, p2, deltabase, cs).

                     The delta base is the previous node, or p1 when there is no
                     previous node.
                     """
                     node, p1, p2, cs = headertuple
                     deltabase = prevnode
                     if deltabase is None:
                         deltabase = p1
                     return node, p1, p2, deltabase, cs
                 def deltachunk(self, prevnode):
                     """Read the next delta chunk and return it as a dict.

                     Returns an empty dict when the chunk is empty; otherwise the
                     dict has the keys node, p1, p2, cs, deltabase and delta.
                     """
                     size = self.chunklength()
                     if not size:
                         return {}
                     rawheader = readexactly(self._stream, self.deltaheadersize)
                     fields = struct.unpack(self.deltaheader, rawheader)
                     delta = readexactly(self._stream, size - self.deltaheadersize)
                     node, p1, p2, deltabase, cs = self._deltaheader(fields, prevnode)
                     return dict(node=node, p1=p1, p2=p2, cs=cs,
                                 deltabase=deltabase, delta=delta)
                 def getchunks(self):
                     """Yield all the chunks contained in the bundle.

                     Used when you need to forward the binary stream to a file or
                     another network API. To do so, it parses the changegroup data,
                     otherwise it would block in case of sshrepo because it does
                     not know where the stream ends.
                     """
                     # an empty chunkgroup is the end of the changegroup
                     # a changegroup has at least 2 chunkgroups (changelog and manifest).
                     # after that, an empty chunkgroup is the end of the changegroup
                     piecesize = 2**20
                     groupempty = False
                     groups = 0
                     while not groupempty or groups <= 2:
                         groupempty = True
                         groups += 1
                         while True:
                             chunk = getchunk(self)
                             if not chunk:
                                 break
                             groupempty = False
                             yield chunkheader(len(chunk))
                             # hand the payload out in pieces of at most 1 MiB
                             for start in xrange(0, len(chunk), piecesize):
                                 yield chunk[start:start + piecesize]
                         yield closechunk()
             class cg2unpacker(cg1unpacker):
                 """Reader for a version '02' changegroup stream.

                 Differs from cg1unpacker by its delta header, which carries the
                 delta base explicitly.
                 """
                 deltaheader = _CHANGEGROUPV2_DELTA_HEADER
                 deltaheadersize = struct.calcsize(deltaheader)
                 version = '02'
                 def _deltaheader(self, headertuple, prevnode):
                     """Return (node, p1, p2, deltabase, cs) as found in the header.

                     prevnode is ignored: the base comes from the header itself.
                     """
                     (node, parent1, parent2, base, changeset) = headertuple
                     return node, parent1, parent2, base, changeset
             class headerlessfixup(object):
                 """File-like reader that serves the bytes h before those of fh.

                 read() first drains the already-consumed prefix h and then falls
                 through to readexactly() on fh.
                 """
                 def __init__(self, fh, h):
                     self._fh = fh
                     self._h = h
                 def read(self, n):
                     """Return n bytes, taken from the pending prefix first."""
                     if not self._h:
                         return readexactly(self._fh, n)
                     head = self._h[:n]
                     self._h = self._h[n:]
                     missing = n - len(head)
                     if missing > 0:
                         # the prefix ran out: complete the request from fh
                         head += readexactly(self._fh, missing)
                     return head
             class cg1packer(object):
                 deltaheader = _CHANGEGROUPV1_DELTA_HEADER
                 version = '01'
                 def __init__(self, repo, bundlecaps=None):
                     """Given a source repo, construct a bundler.
                     bundlecaps is optional and can be used to specify the set of
                     capabilities which can be used to build the bundle.
                     """
                     # Set of capabilities we can use to build the bundle.
                     if bundlecaps is None:
                         bundlecaps = set()
                     self._bundlecaps = bundlecaps
                     self._changelog = repo.changelog
                     self._manifest = repo.manifest
                     reorder = repo.ui.config('bundle', 'reorder', 'auto')
                     if reorder == 'auto':
                         reorder = None
                     else:
                         reorder = util.parsebool(reorder)
                     self._repo = repo
                     self._reorder = reorder
                     self._progress = repo.ui.progress
                     if self._repo.ui.verbose and not self._repo.ui.debugflag:
                         self._verbosenote = self._repo.ui.note
                     else:
                         self._verbosenote = lambda s: None
                 def close(self):
                     return closechunk()
                 def fileheader(self, fname):
                     return chunkheader(len(fname)) + fname
                 def group(self, nodelist, revlog, lookup, units=None, reorder=None):
                     """Calculate a delta group, yielding a sequence of changegroup chunks
                     (strings).
                     Given a list of changeset revs, return a set of deltas and
                     metadata corresponding to nodes. The first delta is
                     first parent(nodelist[0]) -> nodelist[0], the receiver is
                     guaranteed to have this parent as it has all history before
                     these changesets. In the case firstparent is nullrev the
                     changegroup starts with a full revision.
                     If units is not None, progress detail will be generated, units specifies
                     the type of revlog that is touched (changelog, manifest, etc.).
                     """
                     # if we don't have any revisions touched by these changesets, bail
                     if len(nodelist) == 0:
                         yield self.close()
                         return
                     # for generaldelta revlogs, we linearize the revs; this will both be
                     # much quicker and generate a much smaller bundle
                     if (revlog._generaldelta and reorder is not False) or reorder:
                         dag = dagutil.revlogdag(revlog)
                         revs = set(revlog.rev(n) for n in nodelist)
                         revs = dag.linearize(revs)
                     else:
                         revs = sorted([revlog.rev(n) for n in nodelist])
                     # add the parent of the first rev
                     p = revlog.parentrevs(revs[0])[0]
                     revs.insert(0, p)
                     # build deltas
                     total = len(revs) - 1
                     msgbundling = _('bundling')
                     for r in xrange(len(revs) - 1):
                         if units is not None:
                             self._progress(msgbundling, r + 1, unit=units, total=total)
                         prev, curr = revs[r], revs[r + 1]
                         linknode = lookup(revlog.node(curr))
                         for c in self.revchunk(revlog, curr, prev, linknode):
                             yield c
                     yield self.close()
                 # filter any nodes that claim to be part of the known set
                 def prune(self, revlog, missing, commonrevs):
                     rr, rl = revlog.rev, revlog.linkrev
                     return [n for n in missing if rl(rr(n)) not in commonrevs]
                 def generate(self, commonrevs, clnodes, fastpathlinkrev, source):
                     '''yield a sequence of changegroup chunks (strings)'''
                     repo = self._repo
                     cl = self._changelog
                     mf = self._manifest
                     reorder = self._reorder
                     progress = self._progress
                     # for progress output
                     msgbundling = _('bundling')
                     clrevorder = {}
                     mfs = {} # needed manifests
                     fnodes = {} # needed file nodes
                     changedfiles = set()
                     # Callback for the changelog, used to collect changed files and manifest
                     # nodes.
                     # Returns the linkrev node (identity in the changelog case).
                     def lookupcl(x):
                         c = cl.read(x)
                         clrevorder[x] = len(clrevorder)
                         changedfiles.update(c[3])
                         # record the first changeset introducing this manifest version
                         mfs.setdefault(c[0], x)
                         return x
                     self._verbosenote(_('uncompressed size of bundle content:\n'))
                     size = 0
                     for chunk in self.group(clnodes, cl, lookupcl, units=_('changesets'),
                                             reorder=reorder):
                         size += len(chunk)
                         yield chunk
                     self._verbosenote(_('%8.i (changelog)\n') % size)
                     progress(msgbundling, None)
                     # Callback for the manifest, used to collect linkrevs for filelog
                     # revisions.
                     # Returns the linkrev node (collected in lookupcl).
                     def lookupmf(x):
                         clnode = mfs[x]
                         if not fastpathlinkrev or reorder:
                             mdata = mf.readfast(x)
                             for f, n in mdata.iteritems():
                                 if f in changedfiles:
                                     # record the first changeset introducing this filelog
                                     # version
                                     fclnodes = fnodes.setdefault(f, {})
                                     fclnode = fclnodes.setdefault(n, clnode)
                                     if clrevorder[clnode] < clrevorder[fclnode]:
                                         fclnodes[n] = clnode
                         return clnode
                     mfnodes = self.prune(mf, mfs, commonrevs)
                     size = 0
                     for chunk in self.group(mfnodes, mf, lookupmf, units=_('manifests'),
                                             reorder=reorder):
                         size += len(chunk)
                         yield chunk
                     self._verbosenote(_('%8.i (manifests)\n') % size)
                     progress(msgbundling, None)
                     mfs.clear()
-                    needed = set(cl.rev(x) for x in clnodes)
+                    clrevs = set(cl.rev(x) for x in clnodes)
                     def linknodes(filerevlog, fname):
                         if fastpathlinkrev and not reorder:
                             llr = filerevlog.linkrev
                             def genfilenodes():
                                 for r in filerevlog:
                                     linkrev = llr(r)
-                                    if linkrev in needed:
+                                    if linkrev in clrevs:
                                         yield filerevlog.node(r), cl.node(linkrev)
                             return dict(genfilenodes())
                         return fnodes.get(fname, {})
                     for chunk in self.generatefiles(changedfiles, linknodes, commonrevs,
                                                     source):
                         yield chunk
                     yield self.close()
                     progress(msgbundling, None)
                     if clnodes:
                         repo.hook('outgoing', node=hex(clnodes[0]), source=source)
                 # The 'source' parameter is useful for extensions
                 def generatefiles(self, changedfiles, linknodes, commonrevs, source):
                     repo = self._repo
                     progress = self._progress
                     reorder = self._reorder
                     msgbundling = _('bundling')
                     total = len(changedfiles)
                     # for progress output
                     msgfiles = _('files')
                     for i, fname in enumerate(sorted(changedfiles)):
                         filerevlog = repo.file(fname)
                         if not filerevlog:
                             raise util.Abort(_("empty or missing revlog for %s") % fname)
                         linkrevnodes = linknodes(filerevlog, fname)
                         # Lookup for filenodes, we collected the linkrev nodes above in the
                         # fastpath case and with lookupmf in the slowpath case.
                         def lookupfilelog(x):
                             return linkrevnodes[x]
                         filenodes = self.prune(filerevlog, linkrevnodes, commonrevs)
                         if filenodes:
                             progress(msgbundling, i + 1, item=fname, unit=msgfiles,
                                      total=total)
                             h = self.fileheader(fname)
                             size = len(h)
                             yield h
                             for chunk in self.group(filenodes, filerevlog, lookupfilelog,
                                                     reorder=reorder):
                                 size += len(chunk)
                                 yield chunk
                             self._verbosenote(_('%8.i  %s\n') % (size, fname))
                 def deltaparent(self, revlog, rev, p1, p2, prev):
                     return prev
                 def revchunk(self, revlog, rev, prev, linknode):
                     node = revlog.node(rev)
                     p1, p2 = revlog.parentrevs(rev)
                     base = self.deltaparent(revlog, rev, p1, p2, prev)
                     prefix = ''
                     if revlog.iscensored(base) or revlog.iscensored(rev):
                         try:
                             delta = revlog.revision(node)
                         except error.CensoredNodeError, e:
                             delta = e.tombstone
                         if base == nullrev:
                             prefix = mdiff.trivialdiffheader(len(delta))
                         else:
                             baselen = revlog.rawsize(base)
                             prefix = mdiff.replacediffheader(baselen, len(delta))
                     elif base == nullrev:
                         delta = revlog.revision(node)
                         prefix = mdiff.trivialdiffheader(len(delta))
                     else:
                         delta = revlog.revdiff(base, rev)
                     p1n, p2n = revlog.parents(node)
                     basenode = revlog.node(base)
                     meta = self.builddeltaheader(node, p1n, p2n, basenode, linknode)
                     meta += prefix
                     l = len(meta) + len(delta)
                     yield chunkheader(l)
                     yield meta
                     yield delta
                 def builddeltaheader(self, node, p1n, p2n, basenode, linknode):
                     # do nothing with basenode, it is implicitly the previous one in HG10
                     return struct.pack(self.deltaheader, node, p1n, p2n, linknode)
             class cg2packer(cg1packer):
                 """Generator of version '02' changegroup chunks.

                 Compared to cg1packer, the delta base is stored in the delta
                 header and may therefore differ from the previous revision.
                 """
                 version = '02'
                 deltaheader = _CHANGEGROUPV2_DELTA_HEADER
                 def group(self, nodelist, revlog, lookup, units=None, reorder=None):
                     """Like cg1packer.group(), with a different reorder default.

                     For generaldelta revlogs, reordering is disabled unless it
                     was requested with reorder=True.
                     """
                     if revlog._generaldelta and reorder is not True:
                         reorder = False
                     parent = super(cg2packer, self)
                     return parent.group(nodelist, revlog, lookup,
                                         units=units, reorder=reorder)
                 def deltaparent(self, revlog, rev, p1, p2, prev):
                     """Pick the revision used as delta base for rev.

                     The delta parent stored in the revlog is kept when it is one
                     of p1, p2 or prev; in every other case prev is used.
                     """
                     dp = revlog.deltaparent(rev)
                     # avoid storing full revisions; pick prev in those cases
                     # also pick prev when we can't be sure remote has dp
                     usable = dp != nullrev and (dp == p1 or dp == p2 or dp == prev)
                     if usable:
                         return dp
                     return prev
                 def builddeltaheader(self, node, p1n, p2n, basenode, linknode):
                     """Pack the delta header, including the explicit delta base."""
                     fields = (node, p1n, p2n, basenode, linknode)
                     return struct.pack(self.deltaheader, *fields)
             # Maps a changegroup version string to its (packer class, unpacker class)
             # pair: index 0 builds changegroups, index 1 reads them.
             packermap = {'01': (cg1packer, cg1unpacker),
                          '02': (cg2packer, cg2unpacker)}
             def _changegroupinfo(repo, nodes, source):
                 if repo.ui.verbose or source == 'bundle':
                     repo.ui.status(_("%d changesets found\n") % len(nodes))
                 if repo.ui.debugflag:
                     repo.ui.debug("list of changesets:\n")
                     for node in nodes:
                         repo.ui.debug("%s\n" % hex(node))
             def getsubsetraw(repo, outgoing, bundler, source, fastpath=False):
                 """Return the raw chunk generator for the changesets in outgoing.

                 Works on the unfiltered repo, runs the 'preoutgoing' hook, reports
                 the changesets and delegates to bundler.generate(). Note that
                 outgoing.missingheads is sorted in place.
                 """
                 unfi = repo.unfiltered()
                 commonrevs = outgoing.common
                 missing = outgoing.missing
                 missingheads = outgoing.missingheads
                 # We go through the fast path if we get told to, or if all
                 # (unfiltered) heads have been requested (since we then know that
                 # all linkrevs will be pulled by the client).
                 missingheads.sort()
                 if fastpath:
                     fastpathlinkrev = fastpath
                 else:
                     fastpathlinkrev = (unfi.filtername is None
                                        and missingheads == sorted(unfi.heads()))
                 unfi.hook('preoutgoing', throw=True, source=source)
                 _changegroupinfo(unfi, missing, source)
                 return bundler.generate(commonrevs, missing, fastpathlinkrev, source)
             def getsubset(repo, outgoing, bundler, source, fastpath=False, version='01'):
                 """Return an unpacker reading the changegroup built from outgoing.

                 The raw generator from getsubsetraw() is buffered and wrapped in
                 the unpacker class registered for version, as uncompressed data.
                 """
                 rawchunks = getsubsetraw(repo, outgoing, bundler, source, fastpath)
                 unpackercls = packermap[version][1]
                 return unpackercls(util.chunkbuffer(rawchunks), 'UN')
             def changegroupsubset(repo, roots, heads, source, version='01'):
                 """Compute a changegroup consisting of all the nodes that are
                 descendants of any of the roots and ancestors of any of the heads.

                 The result is what getsubset() returns for the packer registered
                 under version.

                 It is fairly complex as determining which filenodes and which
                 manifest nodes need to be included for the changeset to be complete
                 is non-trivial.

                 Another wrinkle is doing the reverse, figuring out which changeset in
                 the changegroup a particular filenode or manifestnode belongs to.
                 """
                 cl = repo.changelog
                 roots = roots or [nullid]
                 # TODO: remove call to nodesbetween.
                 csets, roots, heads = cl.nodesbetween(roots, heads)
                 # the non-null parents of the roots are the bases of the discovery
                 discbases = [p for n in roots for p in cl.parents(n) if p != nullid]
                 outgoing = discovery.outgoing(cl, discbases, heads)
                 packercls = packermap[version][0]
                 return getsubset(repo, outgoing, packercls(repo), source,
                                  version=version)
             def getlocalchangegroupraw(repo, source, outgoing, bundlecaps=None,
                                        version='01'):
                 """Like getbundle, but taking a discovery.outgoing as an argument.

                 This is only implemented for local repos and reuses potentially
                 precomputed sets in outgoing. Returns a raw changegroup generator,
                 or None when outgoing has nothing missing."""
                 if outgoing.missing:
                     packercls = packermap[version][0]
                     return getsubsetraw(repo, outgoing, packercls(repo, bundlecaps),
                                         source)
                 return None
             def getlocalchangegroup(repo, source, outgoing, bundlecaps=None):
                 """Like getbundle, but taking a discovery.outgoing as an argument.

                 This is only implemented for local repos and reuses potentially
                 precomputed sets in outgoing. A cg1packer is always used. Returns
                 None when outgoing has nothing missing."""
                 if outgoing.missing:
                     return getsubset(repo, outgoing, cg1packer(repo, bundlecaps),
                                      source)
                 return None
             def _computeoutgoing(repo, heads, common):
                 """Compute which revs are outgoing given a set of common
                 and a set of heads.

                 Nodes of common unknown to the changelog are dropped; an empty
                 common is replaced by [nullid] and empty heads by the changelog
                 heads.

                 This is a separate function so extensions can have access to
                 the logic.

                 Returns a discovery.outgoing object.
                 """
                 cl = repo.changelog
                 if not common:
                     common = [nullid]
                 else:
                     known = cl.hasnode
                     common = [node for node in common if known(node)]
                 heads = heads or cl.heads()
                 return discovery.outgoing(cl, common, heads)
             def getchangegroupraw(repo, source, heads=None, common=None, bundlecaps=None,
                                   version='01'):
                 """Return a raw changegroup generator for heads minus common.

                 Like changegroupsubset, but the content is the set difference
                 between the ancestors of heads and the ancestors of common.

                 If heads is None, use the local heads. If common is None, use
                 [nullid]. version is forwarded to getlocalchangegroupraw() and
                 defaults to '01'.

                 The nodes in common might not all be known locally due to the way
                 the current discovery protocol works.
                 """
                 missing = _computeoutgoing(repo, heads, common)
                 return getlocalchangegroupraw(repo, source, missing,
                                               bundlecaps=bundlecaps, version=version)
             def getchangegroup(repo, source, heads=None, common=None, bundlecaps=None):
                 """Return a changegroup for heads minus common.

                 Like changegroupsubset, but the content is the set difference
                 between the ancestors of heads and the ancestors of common.

                 If heads is None, use the local heads. If common is None, use
                 [nullid].

                 The nodes in common might not all be known locally due to the way
                 the current discovery protocol works.
                 """
                 missing = _computeoutgoing(repo, heads, common)
                 return getlocalchangegroup(repo, source, missing,
                                            bundlecaps=bundlecaps)
             def changegroup(repo, basenodes, source):
                 """Delegate to changegroupsubset() using the repo's current heads.

                 basenodes and source are passed through unchanged; the heads
                 argument is repo.heads() as read at call time.
                 """
                 # to avoid a race we use changegroupsubset() (issue1320)
                 currentheads = repo.heads()
                 return changegroupsubset(repo, basenodes, currentheads, source)
             def addchangegroupfiles(repo, source, revmap, trp, pr, needfiles):
                 """Add every file revlog group found in source to the repo.

                 File groups are read until source.filelogheader() returns a
                 false-ish value. For each group, pr() is called once and the
                 group is added to repo.file(name) through addgroup(source,
                 revmap, trp).

                 needfiles maps a filename to the collection of nodes that must be
                 received for it. Nodes are removed from it as they arrive and
                 fully satisfied entries are deleted. Whatever is left afterwards
                 must already be present in the corresponding filelog.

                 Raises util.Abort when a group is empty, when its delta base is
                 censored, when a received node was not expected for a file listed
                 in needfiles, or when an expected node is missing at the end.

                 Returns a (revisions, files) tuple: the number of revisions added
                 and the number of file groups processed.
                 """
                 revisions = files = 0
                 while True:
                     header = source.filelogheader()
                     if not header:
                         break
                     fname = header["filename"]
                     repo.ui.debug("adding %s revisions\n" % fname)
                     pr()
                     filelog = repo.file(fname)
                     oldlen = len(filelog)
                     try:
                         added = filelog.addgroup(source, revmap, trp)
                         if not added:
                             raise util.Abort(_("received file revlog group is empty"))
                     except error.CensoredBaseError, e:
                         raise util.Abort(_("received delta base is censored: %s") % e)
                     newlen = len(filelog)
                     revisions += newlen - oldlen
                     files += 1
                     if fname not in needfiles:
                         continue
                     # tick off every node we just received for this file
                     expected = needfiles[fname]
                     for rev in xrange(oldlen, newlen):
                         node = filelog.node(rev)
                         if node not in expected:
                             raise util.Abort(
                                 _("received spurious file revlog entry"))
                         expected.remove(node)
                     if not expected:
                         del needfiles[fname]
                 repo.ui.progress(_('files'), None)

                 # anything still expected must already exist locally
                 for fname, expected in needfiles.iteritems():
                     filelog = repo.file(fname)
                     for node in expected:
                         try:
                             filelog.rev(node)
                         except error.LookupError:
                             raise util.Abort(
                                 _('missing file data for %s:%s - run hg verify') %
                                 (fname, hex(node)))
                 return revisions, files
             def addchangegroup(repo, source, srctype, url, emptyok=False,
                                targetphase=phases.draft):
                 """Add the changegroup returned by source.read() to this repo.

                 srctype is a string like 'push', 'pull', or 'unbundle'.  url is
                 the URL of the repo where this changegroup is coming from.

                 If emptyok is false, an empty changelog group aborts. targetphase
                 is the phase the added changesets are retracted to when srctype is
                 neither 'push'/'serve' nor 'strip'.

                 All work happens inside one transaction. If that transaction
                 already carries 'source' or 'url' hook arguments, those values
                 take precedence over the srctype and url arguments.

                 Return an integer summarizing the change to this repo:
                 - no source: 0
                 - more heads than before: 1+added heads (2..n)
                 - fewer heads than before: -1-removed heads (-2..-n)
                 - number of heads stays the same: 1
                 New heads that close a branch are not counted as added heads.

                 Raises util.Abort when the changelog group is empty (unless
                 emptyok) and for the problems reported by addchangegroupfiles().
                 The prechangegroup and pretxnchangegroup hooks are invoked with
                 throw=True.
                 """
                 repo = repo.unfiltered()

                 # Both callbacks close over 'cl', which is bound further down,
                 # before either of them can be invoked.
                 def csmap(x):
                     repo.ui.debug("add changeset %s\n" % short(x))
                     return len(cl)

                 def revmap(x):
                     return cl.rev(x)

                 if not source:
                     return 0

                 changesets = files = revisions = 0
                 efiles = set()

                 tr = repo.transaction("\n".join([srctype, util.hidepassword(url)]))
                 # Everything after the transaction is opened runs inside the try so
                 # that tr.release() is reached even if the setup below fails.
                 try:
                     # The transaction could have been created before and already
                     # carries source information. In this case we use the top level
                     # data. We overwrite the argument because we need to use the top
                     # level value (if they exist) in this function.
                     srctype = tr.hookargs.setdefault('source', srctype)
                     url = tr.hookargs.setdefault('url', url)

                     # write changelog data to temp files so concurrent readers will
                     # not see inconsistent view
                     cl = repo.changelog
                     cl.delayupdate(tr)
                     oldheads = cl.heads()

                     repo.hook('prechangegroup', throw=True, **tr.hookargs)

                     trp = weakref.proxy(tr)
                     # pull off the changeset group
                     repo.ui.status(_("adding changesets\n"))
                     clstart = len(cl)

                     class prog(object):
                         # Progress callback: each call reports 'count' for the
                         # current 'step' and then advances 'count'. step, count
                         # and total are reset from outside for each phase.
                         step = _('changesets')
                         count = 1
                         ui = repo.ui
                         total = None
                         def __call__(self):
                             self.ui.progress(self.step, self.count, unit=_('chunks'),
                                              total=self.total)
                             self.count += 1
                     pr = prog()
                     source.callback = pr

                     source.changelogheader()
                     srccontent = cl.addgroup(source, csmap, trp)
                     if not (srccontent or emptyok):
                         raise util.Abort(_("received changelog group is empty"))
                     clend = len(cl)
                     changesets = clend - clstart
                     for c in xrange(clstart, clend):
                         efiles.update(repo[c].files())
                     # from here on only the number of touched files is needed
                     efiles = len(efiles)
                     repo.ui.progress(_('changesets'), None)

                     # pull off the manifest group
                     repo.ui.status(_("adding manifests\n"))
                     pr.step = _('manifests')
                     pr.count = 1
                     pr.total = changesets # manifests <= changesets
                     # no need to check for empty manifest group here:
                     # if the result of the merge of 1 and 2 is the same in 3 and 4,
                     # no new manifest will be created and the manifest group will
                     # be empty during the pull
                     source.manifestheader()
                     repo.manifest.addgroup(source, revmap, trp)
                     repo.ui.progress(_('manifests'), None)

                     needfiles = {}
                     if repo.ui.configbool('server', 'validate', default=False):
                         # validate incoming csets have their manifests
                         for cset in xrange(clstart, clend):
                             mfest = repo.changelog.read(repo.changelog.node(cset))[0]
                             mfest = repo.manifest.readdelta(mfest)
                             # store file nodes we must see
                             for f, n in mfest.iteritems():
                                 needfiles.setdefault(f, set()).add(n)

                     # process the files
                     repo.ui.status(_("adding file changes\n"))
                     pr.step = _('files')
                     pr.count = 1
                     pr.total = efiles
                     # pr is passed explicitly below, so detach it from the source
                     source.callback = None

                     newrevs, newfiles = addchangegroupfiles(repo, source, revmap, trp, pr,
                                                             needfiles)
                     revisions += newrevs
                     files += newfiles

                     # head delta, ignoring new heads that close a branch
                     dh = 0
                     if oldheads:
                         heads = cl.heads()
                         dh = len(heads) - len(oldheads)
                         for h in heads:
                             if h not in oldheads and repo[h].closesbranch():
                                 dh -= 1
                     htext = ""
                     if dh:
                         htext = _(" (%+d heads)") % dh

                     repo.ui.status(_("added %d changesets"
                                      " with %d changes to %d files%s\n")
                                      % (changesets, revisions, files, htext))
                     repo.invalidatevolatilesets()

                     if changesets > 0:
                         p = lambda: tr.writepending() and repo.root or ""
                         # 'node' is the first added changeset; an already present
                         # transaction-level 'node' is left untouched and only
                         # overridden in the local copy used for these hooks
                         if 'node' not in tr.hookargs:
                             tr.hookargs['node'] = hex(cl.node(clstart))
                             hookargs = dict(tr.hookargs)
                         else:
                             hookargs = dict(tr.hookargs)
                             hookargs['node'] = hex(cl.node(clstart))
                         repo.hook('pretxnchangegroup', throw=True, pending=p, **hookargs)

                     added = [cl.node(r) for r in xrange(clstart, clend)]
                     publishing = repo.ui.configbool('phases', 'publish', True)
                     if srctype in ('push', 'serve'):
                         # Old servers can not push the boundary themselves.
                         # New servers won't push the boundary if changeset already
                         # exists locally as secret
                         #
                         # We should not use added here but the list of all change in
                         # the bundle
                         if publishing:
                             phases.advanceboundary(repo, tr, phases.public, srccontent)
                         else:
                             # Those changesets have been pushed from the outside, their
                             # phases are going to be pushed alongside. Therefore
                             # `targetphase` is ignored.
                             phases.advanceboundary(repo, tr, phases.draft, srccontent)
                             phases.retractboundary(repo, tr, phases.draft, added)
                     elif srctype != 'strip':
                         # publishing only alter behavior during push
                         #
                         # strip should not touch boundary at all
                         phases.retractboundary(repo, tr, targetphase, added)

                     if changesets > 0:
                         if srctype != 'strip':
                             # During strip, branchcache is invalid but coming call to
                             # `destroyed` will repair it.
                             # In other case we can safely update cache on disk.
                             branchmap.updatecache(repo.filtered('served'))

                         def runhooks():
                             # These hooks run when the lock releases, not when the
                             # transaction closes. So it's possible for the changelog
                             # to have changed since we last saw it.
                             if clstart >= len(repo):
                                 return

                             # Only the debug message is emitted here; no branch
                             # cache update is performed at this point.
                             repo.ui.debug("updating the branch cache\n")
                             repo.hook("changegroup", **hookargs)

                             for n in added:
                                 args = hookargs.copy()
                                 args['node'] = hex(n)
                                 repo.hook("incoming", **args)

                             newheads = [h for h in repo.heads() if h not in oldheads]
                             repo.ui.log("incoming",
                                         "%s incoming changes - new heads: %s\n",
                                         len(added),
                                         ', '.join([hex(c[:6]) for c in newheads]))

                         tr.addpostclose('changegroup-runhooks-%020i' % clstart,
                                         lambda tr: repo._afterlock(runhooks))

                     tr.close()

                 finally:
                     tr.release()
                     repo.ui.flush()
                 # never return 0 here:
                 if dh < 0:
                     return dh - 1
                 else:
                     return dh + 1