upstream/mercurial-mirror Commit - r28230:0c2a088f

1

# changegroup.py - Mercurial changegroup manipulation functions

1

# changegroup.py - Mercurial changegroup manipulation functions

2

#

2

#

3

4

#

4

#

5

# This software may be used and distributed according to the terms of the

5

# This software may be used and distributed according to the terms of the

6

# GNU General Public License version 2 or any later version.

6

# GNU General Public License version 2 or any later version.

7

8

from __future__ import absolute_import

8

from __future__ import absolute_import

9

10

import os

10

import os

11

import struct

11

import struct

12

import tempfile

12

import tempfile

13

import weakref

13

import weakref

14

15

from .i18n import _

15

from .i18n import _

16

from .node import (

16

from .node import (

17

hex,

17

hex,

18

nullid,

18

nullid,

19

nullrev,

19

nullrev,

20

short,

20

short,

21

)

21

)

22

23

from . import (

23

from . import (

24

branchmap,

24

branchmap,

25

dagutil,

25

dagutil,

26

discovery,

26

discovery,

27

error,

27

error,

28

mdiff,

28

mdiff,

29

phases,

29

phases,

30

util,

30

util,

31

)

31

)

32

33

# struct formats of the per-revision delta header for each changegroup
# version. Every "20s" field is a 20-byte string.
# v1 fields, in order: node, p1, p2, cs (linked changeset).
_CHANGEGROUPV1_DELTA_HEADER = "20s20s20s20s"
# v2 fields, in order: node, p1, p2, deltabase, cs.
_CHANGEGROUPV2_DELTA_HEADER = "20s20s20s20s20s"
# v3 appends an unsigned 16-bit field and makes big-endian byte order
# explicit (presumably the revlog flags mentioned by cg3unpacker -- confirm).
_CHANGEGROUPV3_DELTA_HEADER = ">20s20s20s20s20sH"

36

37

def readexactly(stream, n):
    '''read n bytes from stream.read and abort if less was available

    Returns the data read. Raises error.Abort when stream.read(n) yields
    fewer than n bytes; the message reports both the received and the
    expected byte counts.
    '''
    s = stream.read(n)
    if len(s) < n:
        raise error.Abort(_("stream ended unexpectedly"
                            " (got %d bytes, expected %d)")
                          % (len(s), n))
    return s

45

46

def getchunk(stream):
    """return the next chunk from stream as a string

    A chunk starts with a 4-byte big-endian signed length that counts the
    length field itself. A length of 0 marks an empty chunk and yields "";
    any other length of 4 or less is invalid and raises error.Abort.
    """
    d = readexactly(stream, 4)
    length = struct.unpack(">l", d)[0]
    if length <= 4:
        if length:
            raise error.Abort(_("invalid chunk length %d") % length)
        return ""
    # the encoded length includes the 4 header bytes already consumed
    return readexactly(stream, length - 4)

55

56

def chunkheader(length):
    """return a changegroup chunk header (string)

    length is the payload size; the encoded value is length + 4 because
    the 4-byte big-endian header counts itself.
    """
    return struct.pack(">l", length + 4)

59

60

def closechunk():
    """return a changegroup chunk header (string) for a zero-length chunk

    The result is a 4-byte big-endian zero, which getchunk() reads back as
    an empty chunk.
    """
    return struct.pack(">l", 0)

63

64

def combineresults(results):
    """logic to combine 0 or more addchangegroup results into one

    Each result uses the encoding returned by the unpacker's apply():
    0 for nothing changed, 1 for an unchanged head count, 1 + n for n added
    heads and -1 - n for n removed heads. The head deltas are summed and
    re-encoded the same way. With no results at all, 1 is returned.
    """
    changedheads = 0
    for ret in results:
        # If any changegroup result is 0, return 0. Returning right away
        # keeps head deltas gathered from earlier results from overriding
        # the 0 afterwards.
        if ret == 0:
            return 0
        if ret < -1:
            changedheads += ret + 1
        elif ret > 1:
            changedheads += ret - 1
    if changedheads > 0:
        return 1 + changedheads
    if changedheads < 0:
        return -1 + changedheads
    return 1

82

83

# Maps a bundle type name to (header written to the file, compression key).
bundletypes = {
    # only when using unbundle on ssh and old http servers
    # since the unification ssh accepts a header but there
    # is no capability signaling it.
    "": ("", None),
    "HG20": (), # special-cased below
    "HG10UN": ("HG10UN", None),
    # NOTE(review): the header stops at "HG10" here; presumably the
    # compressed stream itself supplies the trailing "BZ" -- confirm.
    "HG10BZ": ("HG10", 'BZ'),
    "HG10GZ": ("HG10GZ", 'GZ'),
}

# hgweb uses this list to communicate its preferred type
bundlepriority = ['HG10GZ', 'HG10BZ', 'HG10UN']

95

96

def writechunks(ui, chunks, filename, vfs=None):
    """Write chunks to a file and return its filename.

    The stream is assumed to be a bundle file.
    If no filename is specified, a temporary file is created
    (prefix "hg-bundle-", suffix ".hg").
    A named file is opened with mode "wb" -- through vfs when one is given,
    otherwise with the builtin open(), which truncates an existing file.
    If writing fails, the file is removed again before the error propagates.

    ui is accepted for interface compatibility; this function does not
    use it.
    """
    fh = None
    cleanup = None
    try:
        if filename:
            if vfs:
                fh = vfs.open(filename, "wb")
            else:
                fh = open(filename, "wb")
        else:
            fd, filename = tempfile.mkstemp(prefix="hg-bundle-", suffix=".hg")
            fh = os.fdopen(fd, "wb")
        # from here on the file exists; remember it so a failure removes it
        cleanup = filename
        for c in chunks:
            fh.write(c)
        # everything was written: disarm the cleanup
        cleanup = None
        return filename
    finally:
        if fh is not None:
            fh.close()
        if cleanup is not None:
            # filename is always set once cleanup is armed, so only vfs
            # decides which unlink is used
            if vfs:
                vfs.unlink(cleanup)
            else:
                os.unlink(cleanup)

127

128

def writebundle(ui, cg, filename, bundletype, vfs=None, compression=None):
    """Write a bundle file and return its filename.

    If no filename is specified, a temporary file is created.
    The bundle file will be deleted in case of errors.

    bundletype selects the container. "HG20" wraps the changegroup in a
    bundle2 'changegroup' part and applies `compression` to it. Any other
    type is looked up in `bundletypes`; it requires a version '01'
    changegroup and `compression` must be left as None.

    Raises error.Abort when a non-v1 changegroup is given for an old bundle
    type or when the bundle type's compressor is unknown.
    """

    if bundletype == "HG20":
        from . import bundle2
        bundle = bundle2.bundle20(ui)
        bundle.setcompression(compression)
        part = bundle.newpart('changegroup', data=cg.getchunks())
        part.addparam('version', cg.version)
        chunkiter = bundle.getchunks()
    else:
        # compression argument is only for the bundle2 case
        assert compression is None
        if cg.version != '01':
            raise error.Abort(_('old bundle types only supports v1 '
                                'changegroups'))
        header, comp = bundletypes[bundletype]
        if comp not in util.compressors:
            raise error.Abort(_('unknown stream compression type: %s')
                              % comp)
        z = util.compressors[comp]()
        subchunkiter = cg.getchunks()
        def compressedchunks():
            # the header goes out verbatim; only the changegroup chunks
            # pass through the compressor
            yield header
            for chunk in subchunkiter:
                yield z.compress(chunk)
            yield z.flush()
        chunkiter = compressedchunks()

    # The data comes from cg.getchunks(), which parses the changegroup to
    # find its end; otherwise we would block in case of sshrepo because we
    # don't know the end of the stream.
    return writechunks(ui, chunkiter, filename, vfs=vfs)

170

171

class cg1unpacker(object):
    """Unpacker for cg1 changegroup streams.

    A changegroup unpacker handles the framing of the revision data in
    the wire format. Most consumers will want to use the apply()
    method to add the changes from the changegroup to a repository.

    If you're forwarding a changegroup unmodified to another consumer,
    use getchunks(), which returns an iterator of changegroup
    chunks. This is mostly useful for cases where you need to know the
    data stream has ended by observing the end of the changegroup.

    deltachunk() is useful only if you're applying delta data. Most
    consumers should prefer apply() instead.

    A few other public methods exist. Those are used only for
    bundlerepo and some debug commands - their use is discouraged.
    """
    deltaheader = _CHANGEGROUPV1_DELTA_HEADER
    deltaheadersize = struct.calcsize(deltaheader)
    version = '01'
    _grouplistcount = 1 # One list of files after the manifests

    def __init__(self, fh, alg):
        """Wrap file object fh, decompressing it with algorithm alg.

        'UN' is treated as None (no compression). Raises error.Abort when
        alg is not a key of util.decompressors.
        """
        if alg == 'UN':
            alg = None # get more modern without breaking too much
        if alg not in util.decompressors:
            raise error.Abort(_('unknown stream compression type: %s')
                              % alg)
        if alg == 'BZ':
            alg = '_truncatedBZ'
        self._stream = util.decompressors[alg](fh)
        self._type = alg
        # optional zero-argument callable invoked once per non-empty chunk
        # (see _chunklength); apply() uses it to report progress
        self.callback = None

    # These methods (compressed, read, seek, tell) all appear to only
    # be used by bundlerepo, but it's a little hard to tell.
    def compressed(self):
        return self._type is not None

    def read(self, l):
        return self._stream.read(l)

    def seek(self, pos):
        return self._stream.seek(pos)

    def tell(self):
        return self._stream.tell()

    def close(self):
        return self._stream.close()

    def _chunklength(self):
        """Read a chunk header and return the payload length.

        Returns 0 for an empty chunk and raises error.Abort for any other
        encoded length of 4 or less. self.callback, when set, is invoked
        for every non-empty chunk.
        """
        d = readexactly(self._stream, 4)
        l = struct.unpack(">l", d)[0]
        if l <= 4:
            if l:
                raise error.Abort(_("invalid chunk length %d") % l)
            return 0
        if self.callback:
            self.callback()
        return l - 4

    def changelogheader(self):
        """v10 does not have a changelog header chunk"""
        return {}

    def manifestheader(self):
        """v10 does not have a manifest header chunk"""
        return {}

    def filelogheader(self):
        """return the header of the filelogs chunk, v10 only has the filename"""
        l = self._chunklength()
        if not l:
            return {}
        fname = readexactly(self._stream, l)
        return {'filename': fname}

    def _deltaheader(self, headertuple, prevnode):
        """Expand an unpacked v1 delta header to the common 6-tuple.

        v1 headers carry no delta base: the base is p1 for the first chunk
        of a group (prevnode is None) and the previous node otherwise.
        Flags are always 0.
        """
        node, p1, p2, cs = headertuple
        if prevnode is None:
            deltabase = p1
        else:
            deltabase = prevnode
        flags = 0
        return node, p1, p2, deltabase, cs, flags

    def deltachunk(self, prevnode):
        """Read the next delta chunk; return {} at the end of the group.

        Otherwise the result is a dict with the keys 'node', 'p1', 'p2',
        'cs', 'deltabase', 'delta' and 'flags'.
        """
        l = self._chunklength()
        if not l:
            return {}
        headerdata = readexactly(self._stream, self.deltaheadersize)
        header = struct.unpack(self.deltaheader, headerdata)
        # NOTE(review): when l is smaller than deltaheadersize the length
        # below is negative and readexactly's short-read check cannot fire;
        # what the stream returns for a negative size is not visible here.
        delta = readexactly(self._stream, l - self.deltaheadersize)
        node, p1, p2, deltabase, cs, flags = self._deltaheader(header, prevnode)
        return {'node': node, 'p1': p1, 'p2': p2, 'cs': cs,
                'deltabase': deltabase, 'delta': delta, 'flags': flags}

    def getchunks(self):
        """return all the chunks contained in the bundle

        Used when you need to forward the binary stream to a file or another
        network API. To do so, it parses the changegroup data, otherwise it
        would block in case of sshrepo because it doesn't know the end of
        the stream.
        """
        # an empty chunkgroup is the end of the changegroup
        # a changegroup has at least 2 chunkgroups (changelog and manifest).
        # after that, changegroup versions 1 and 2 have a series of groups
        # with one group per file. changegroup 3 has a series of directory
        # manifests before the files.
        count = 0
        emptycount = 0
        while emptycount < self._grouplistcount:
            empty = True
            count += 1
            while True:
                chunk = getchunk(self)
                if not chunk:
                    # only groups after the first two (changelog and
                    # manifest) count as list terminators when empty
                    if empty and count > 2:
                        emptycount += 1
                    break
                empty = False
                yield chunkheader(len(chunk))
                # hand the payload out in pieces of at most 1 MiB
                pos = 0
                while pos < len(chunk):
                    end = pos + 2**20
                    yield chunk[pos:end]
                    pos = end
            yield closechunk()

    def _unpackmanifests(self, repo, revmap, trp, prog, numchanges):
        """Add the manifest group to repo.manifest, reporting progress."""
        # We know that we'll never have more manifests than we had
        # changesets.
        self.callback = prog(_('manifests'), numchanges)
        # no need to check for empty manifest group here:
        # if the result of the merge of 1 and 2 is the same in 3 and 4,
        # no new manifest will be created and the manifest group will
        # be empty during the pull
        self.manifestheader()
        repo.manifest.addgroup(self, revmap, trp)
        repo.ui.progress(_('manifests'), None)

    def apply(self, repo, srctype, url, emptyok=False,
              targetphase=phases.draft, expectedtotal=None):
        """Add the changegroup returned by source.read() to this repo.
        srctype is a string like 'push', 'pull', or 'unbundle'.  url is
        the URL of the repo where this changegroup is coming from.

        Raises error.Abort when the changelog group is empty and emptyok
        is false.

        Return an integer summarizing the change to this repo:
        - more heads than before: 1+added heads (2..n)
        - fewer heads than before: -1-removed heads (-2..-n)
        - number of heads stays the same: 1

        This method itself never returns 0; that value is reserved for
        "nothing changed or no source".
        """
        repo = repo.unfiltered()
        def csmap(x):
            repo.ui.debug("add changeset %s\n" % short(x))
            return len(cl)

        def revmap(x):
            return cl.rev(x)

        changesets = files = revisions = 0

        try:
            with repo.transaction("\n".join([srctype,
                                             util.hidepassword(url)])) as tr:
                # The transaction could have been created before and already
                # carries source information. In this case we use the top
                # level data. We overwrite the argument because we need to use
                # the top level value (if they exist) in this function.
                srctype = tr.hookargs.setdefault('source', srctype)
                url = tr.hookargs.setdefault('url', url)
                repo.hook('prechangegroup', throw=True, **tr.hookargs)

                # write changelog data to temp files so concurrent readers
                # will not see an inconsistent view
                cl = repo.changelog
                cl.delayupdate(tr)
                oldheads = cl.heads()

                trp = weakref.proxy(tr)
                # pull off the changeset group
                repo.ui.status(_("adding changesets\n"))
                clstart = len(cl)
                class prog(object):
                    # progress reporter: every call advances the count by one
                    def __init__(self, step, total):
                        self._step = step
                        self._total = total
                        self._count = 1
                    def __call__(self):
                        repo.ui.progress(self._step, self._count,
                                         unit=_('chunks'), total=self._total)
                        self._count += 1
                self.callback = prog(_('changesets'), expectedtotal)

                efiles = set()
                def onchangelog(cl, node):
                    efiles.update(cl.read(node)[3])

                self.changelogheader()
                srccontent = cl.addgroup(self, csmap, trp,
                                         addrevisioncb=onchangelog)
                # from here on only the number of touched files is needed
                efiles = len(efiles)

                if not (srccontent or emptyok):
                    raise error.Abort(_("received changelog group is empty"))
                clend = len(cl)
                changesets = clend - clstart
                repo.ui.progress(_('changesets'), None)

                # pull off the manifest group
                repo.ui.status(_("adding manifests\n"))
                self._unpackmanifests(repo, revmap, trp, prog, changesets)

                needfiles = {}
                if repo.ui.configbool('server', 'validate', default=False):
                    # validate incoming csets have their manifests
                    for cset in xrange(clstart, clend):
                        mfnode = repo.changelog.read(
                            repo.changelog.node(cset))[0]
                        mfest = repo.manifest.readdelta(mfnode)
                        # store file nodes we must see
                        for f, n in mfest.iteritems():
                            needfiles.setdefault(f, set()).add(n)

                # process the files
                repo.ui.status(_("adding file changes\n"))
                self.callback = None
                pr = prog(_('files'), efiles)
                newrevs, newfiles = _addchangegroupfiles(
                    repo, self, revmap, trp, pr, needfiles)
                revisions += newrevs
                files += newfiles

                dh = 0
                if oldheads:
                    heads = cl.heads()
                    dh = len(heads) - len(oldheads)
                    # new heads that close a branch do not count as added
                    for h in heads:
                        if h not in oldheads and repo[h].closesbranch():
                            dh -= 1
                htext = ""
                if dh:
                    htext = _(" (%+d heads)") % dh

                repo.ui.status(_("added %d changesets"
                                 " with %d changes to %d files%s\n")
                               % (changesets, revisions, files, htext))
                repo.invalidatevolatilesets()

                if changesets > 0:
                    if 'node' not in tr.hookargs:
                        tr.hookargs['node'] = hex(cl.node(clstart))
                        tr.hookargs['node_last'] = hex(cl.node(clend - 1))
                        hookargs = dict(tr.hookargs)
                    else:
                        # keep the node already recorded on the transaction;
                        # only this call's copy gets the new range
                        hookargs = dict(tr.hookargs)
                        hookargs['node'] = hex(cl.node(clstart))
                        hookargs['node_last'] = hex(cl.node(clend - 1))
                    repo.hook('pretxnchangegroup', throw=True, **hookargs)

                added = [cl.node(r) for r in xrange(clstart, clend)]
                publishing = repo.publishing()
                if srctype in ('push', 'serve'):
                    # Old servers can not push the boundary themselves.
                    # New servers won't push the boundary if changeset already
                    # exists locally as secret
                    #
                    # We should not use added here but the list of all change in
                    # the bundle
                    if publishing:
                        phases.advanceboundary(repo, tr, phases.public,
                                               srccontent)
                    else:
                        # Those changesets have been pushed from the
                        # outside, their phases are going to be pushed
                        # alongside. Therefore `targetphase` is
                        # ignored.
                        phases.advanceboundary(repo, tr, phases.draft,
                                               srccontent)
                        phases.retractboundary(repo, tr, phases.draft, added)
                elif srctype != 'strip':
                    # publishing only alter behavior during push
                    #
                    # strip should not touch boundary at all
                    phases.retractboundary(repo, tr, targetphase, added)

                if changesets > 0:
                    if srctype != 'strip':
                        # During strip, branchcache is invalid but
                        # coming call to `destroyed` will repair it.
                        # In other case we can safely update cache on
                        # disk.
                        branchmap.updatecache(repo.filtered('served'))

                    def runhooks():
                        # These hooks run when the lock releases, not when the
                        # transaction closes. So it's possible for the changelog
                        # to have changed since we last saw it.
                        if clstart >= len(repo):
                            return

                        # forcefully update the on-disk branch cache
                        repo.ui.debug("updating the branch cache\n")
                        repo.hook("changegroup", **hookargs)

                        for n in added:
                            args = hookargs.copy()
                            args['node'] = hex(n)
                            del args['node_last']
                            repo.hook("incoming", **args)

                        newheads = [h for h in repo.heads()
                                    if h not in oldheads]
                        repo.ui.log("incoming",
                                    "%s incoming changes - new heads: %s\n",
                                    len(added),
                                    ', '.join([hex(c[:6]) for c in newheads]))

                    tr.addpostclose('changegroup-runhooks-%020i' % clstart,
                                    lambda tr: repo._afterlock(runhooks))
        finally:
            repo.ui.flush()
        # never return 0 here:
        if dh < 0:
            return dh - 1
        else:
            return dh + 1

497

498

class cg2unpacker(cg1unpacker):
    """Unpacker for cg2 streams.

    The only difference from cg1 is the delta header: cg2 supports
    generaldelta, so every header names its delta base explicitly.
    Everything else about the stream is inherited unchanged.
    """
    deltaheader = _CHANGEGROUPV2_DELTA_HEADER
    deltaheadersize = struct.calcsize(deltaheader)
    version = '02'

    def _deltaheader(self, headertuple, prevnode):
        """Expand a five-field cg2 header into the six-field form.

        prevnode is not consulted here because the header carries the
        delta base itself.
        """
        (node, p1, p2, deltabase, cs) = headertuple
        # cg2 has no flags field on the wire; report the flags as 0
        return (node, p1, p2, deltabase, cs, 0)

513

514

class cg3unpacker(cg2unpacker):
    """Unpacker for cg3 streams.

    On top of cg2, a cg3 stream carries the revlog flags in every delta
    header and can exchange treemanifests. An empty chunk separates the
    manifests from the files.
    """
    deltaheader = _CHANGEGROUPV3_DELTA_HEADER
    deltaheadersize = struct.calcsize(deltaheader)
    version = '03'
    _grouplistcount = 2 # One list of manifests and one list of files

    def _deltaheader(self, headertuple, prevnode):
        """Return the six header fields; cg3 already transmits all of them."""
        (node, p1, p2, deltabase, cs, flags) = headertuple
        return (node, p1, p2, deltabase, cs, flags)

    def _unpackmanifests(self, repo, revmap, trp, prog, numchanges):
        """Unpack the root manifests, then any directory manifest groups.

        Raises error.Abort when a directory revlog group turns out to be
        empty (addgroup() returned a false value).
        """
        super(cg3unpacker, self)._unpackmanifests(repo, revmap, trp, prog,
                                                  numchanges)
        header = self.filelogheader()
        while header:
            # If we get here, there are directory manifests in the changegroup
            dirname = header["filename"]
            repo.ui.debug("adding %s revisions\n" % dirname)
            if not repo.manifest.dirlog(dirname).addgroup(self, revmap, trp):
                raise error.Abort(_("received dir revlog group is empty"))
            header = self.filelogheader()

543

544

class headerlessfixup(object):
    """Reader that serves the bytes of ``h`` first, then reads from ``fh``.

    Only ``read(n)`` is provided. Reads that go past the remaining part
    of ``h`` are completed with readexactly() on the wrapped file object.
    """
    def __init__(self, fh, h):
        self._fh = fh
        self._h = h

    def read(self, n):
        """Return n bytes, draining the pending header before the file."""
        if not self._h:
            # header fully consumed: plain pass-through
            return readexactly(self._fh, n)
        data = self._h[:n]
        self._h = self._h[n:]
        if len(data) < n:
            # the header ran out mid-read; top up from the file
            data += readexactly(self._fh, n - len(data))
        return data

555

556

def _moddirs(files):

556

def _moddirs(files):

557

"""Given a set of modified files, find the list of modified directories.

557

"""Given a set of modified files, find the list of modified directories.

558

559

This returns a list of (path to changed dir, changed dir) tuples,

559

This returns a list of (path to changed dir, changed dir) tuples,

560

as that's what the one client needs anyway.

560

as that's what the one client needs anyway.

561

562

>>> _moddirs(['a/b/c.py', 'a/b/c.txt', 'a/d/e/f/g.txt', 'i.txt', ])

562

>>> _moddirs(['a/b/c.py', 'a/b/c.txt', 'a/d/e/f/g.txt', 'i.txt', ])

563

[('/', 'a/'), ('a/', 'b/'), ('a/', 'd/'), ('a/d/', 'e/'), ('a/d/e/', 'f/')]

563

[('/', 'a/'), ('a/', 'b/'), ('a/', 'd/'), ('a/d/', 'e/'), ('a/d/e/', 'f/')]

564

565

"""

565

"""

566

alldirs = set()

566

alldirs = set()

567

for f in files:

567

for f in files:

568

path = f.split('/')[:-1]

568

path = f.split('/')[:-1]

569

for i in xrange(len(path) - 1, -1, -1):

569

for i in xrange(len(path) - 1, -1, -1):

570

dn = '/'.join(path[:i])

570

dn = '/'.join(path[:i])

571

current = dn + '/', path[i] + '/'

571

current = dn + '/', path[i] + '/'

572

if current in alldirs:

572

if current in alldirs:

573

break

573

break

574

alldirs.add(current)

574

alldirs.add(current)

575

return sorted(alldirs)

575

return sorted(alldirs)

576

577

class cg1packer(object):
    """Packer producing version '01' changegroup streams.

    Subclasses change the wire format by overriding ``deltaheader``,
    ``version`` and the hook methods (deltaparent, builddeltaheader,
    _packmanifests, _manifestsdone).
    """
    deltaheader = _CHANGEGROUPV1_DELTA_HEADER
    version = '01'
    def __init__(self, repo, bundlecaps=None):
        """Given a source repo, construct a bundler.

        bundlecaps is optional and can be used to specify the set of
        capabilities which can be used to build the bundle.
        """
        # Set of capabilities we can use to build the bundle.
        if bundlecaps is None:
            bundlecaps = set()
        self._bundlecaps = bundlecaps
        # experimental config: bundle.reorder
        reorder = repo.ui.config('bundle', 'reorder', 'auto')
        if reorder == 'auto':
            reorder = None
        else:
            reorder = util.parsebool(reorder)
        self._repo = repo
        self._reorder = reorder
        self._progress = repo.ui.progress
        if self._repo.ui.verbose and not self._repo.ui.debugflag:
            self._verbosenote = self._repo.ui.note
        else:
            self._verbosenote = lambda s: None

    def close(self):
        """Return the chunk emitted at the end of a group (closechunk())."""
        return closechunk()

    def fileheader(self, fname):
        """Return a chunk header sized for fname, followed by fname."""
        return chunkheader(len(fname)) + fname

    def group(self, nodelist, revlog, lookup, units=None):
        """Calculate a delta group, yielding a sequence of changegroup chunks
        (strings).

        Given a list of changeset revs, return a set of deltas and
        metadata corresponding to nodes. The first delta is
        first parent(nodelist[0]) -> nodelist[0], the receiver is
        guaranteed to have this parent as it has all history before
        these changesets. In the case firstparent is nullrev the
        changegroup starts with a full revision.

        If units is not None, progress detail will be generated, units specifies
        the type of revlog that is touched (changelog, manifest, etc.).
        """
        # if we don't have any revisions touched by these changesets, bail
        if len(nodelist) == 0:
            yield self.close()
            return

        # for generaldelta revlogs, we linearize the revs; this will both be
        # much quicker and generate a much smaller bundle
        if (revlog._generaldelta and self._reorder is None) or self._reorder:
            dag = dagutil.revlogdag(revlog)
            revs = set(revlog.rev(n) for n in nodelist)
            revs = dag.linearize(revs)
        else:
            revs = sorted([revlog.rev(n) for n in nodelist])

        # add the parent of the first rev
        p = revlog.parentrevs(revs[0])[0]
        revs.insert(0, p)

        # build deltas
        total = len(revs) - 1
        msgbundling = _('bundling')
        for r in xrange(len(revs) - 1):
            if units is not None:
                self._progress(msgbundling, r + 1, unit=units, total=total)
            prev, curr = revs[r], revs[r + 1]
            linknode = lookup(revlog.node(curr))
            for c in self.revchunk(revlog, curr, prev, linknode):
                yield c

        if units is not None:
            self._progress(msgbundling, None)
        yield self.close()

    # filter any nodes that claim to be part of the known set
    def prune(self, revlog, missing, commonrevs):
        """Return the nodes of missing whose linkrev is not in commonrevs."""
        rr, rl = revlog.rev, revlog.linkrev
        return [n for n in missing if rl(rr(n)) not in commonrevs]

    def _packmanifests(self, dir, mfnodes, lookuplinknode):
        """Pack flat manifests into a changegroup stream."""
        assert not dir
        for chunk in self.group(mfnodes, self._repo.manifest,
                                lookuplinknode, units=_('manifests')):
            yield chunk

    def _manifestsdone(self):
        """Return what follows the manifest groups; nothing for this format."""
        return ''

    def generate(self, commonrevs, clnodes, fastpathlinkrev, source):
        '''yield a sequence of changegroup chunks (strings)

        The changelog group comes first, then the manifests, then the
        files, then a closing chunk. Once everything has been yielded the
        'outgoing' hook is run if clnodes is not empty.
        '''
        repo = self._repo
        cl = repo.changelog

        clrevorder = {}
        mfs = {} # needed manifests
        fnodes = {} # needed file nodes
        # maps manifest node id -> set(changed files)
        mfchangedfiles = {}

        # Callback for the changelog, used to collect changed files and manifest
        # nodes.
        # Returns the linkrev node (identity in the changelog case).
        def lookupcl(x):
            c = cl.read(x)
            clrevorder[x] = len(clrevorder)
            n = c[0]
            # record the first changeset introducing this manifest version
            mfs.setdefault(n, x)
            # Record a complete list of potentially-changed files in
            # this manifest.
            mfchangedfiles.setdefault(n, set()).update(c[3])
            return x

        self._verbosenote(_('uncompressed size of bundle content:\n'))
        size = 0
        for chunk in self.group(clnodes, cl, lookupcl, units=_('changesets')):
            size += len(chunk)
            yield chunk
        self._verbosenote(_('%8.i (changelog)\n') % size)

        # We need to make sure that the linkrev in the changegroup refers to
        # the first changeset that introduced the manifest or file revision.
        # The fastpath is usually safer than the slowpath, because the filelogs
        # are walked in revlog order.
        #
        # When taking the slowpath with reorder=None and the manifest revlog
        # uses generaldelta, the manifest may be walked in the "wrong" order.
        # Without 'clrevorder', we would get an incorrect linkrev (see fix in
        # cc0ff93d0c0c).
        #
        # When taking the fastpath, we are only vulnerable to reordering
        # of the changelog itself. The changelog never uses generaldelta, so
        # it is only reordered when reorder=True. To handle this case, we
        # simply take the slowpath, which already has the 'clrevorder' logic.
        # This was also fixed in cc0ff93d0c0c.
        fastpathlinkrev = fastpathlinkrev and not self._reorder
        # Treemanifests don't work correctly with fastpathlinkrev
        # either, because we don't discover which directory nodes to
        # send along with files. This could probably be fixed.
        fastpathlinkrev = fastpathlinkrev and (
            'treemanifest' not in repo.requirements)

        for chunk in self.generatemanifests(commonrevs, clrevorder,
                fastpathlinkrev, mfs, mfchangedfiles, fnodes):
            yield chunk
        mfs.clear()
        clrevs = set(cl.rev(x) for x in clnodes)

        if not fastpathlinkrev:
            def linknodes(unused, fname):
                return fnodes.get(fname, {})
        else:
            cln = cl.node
            def linknodes(filerevlog, fname):
                llr = filerevlog.linkrev
                fln = filerevlog.node
                revs = ((r, llr(r)) for r in filerevlog)
                return dict((fln(r), cln(lr)) for r, lr in revs if lr in clrevs)

        changedfiles = set()
        for x in mfchangedfiles.itervalues():
            changedfiles.update(x)
        for chunk in self.generatefiles(changedfiles, linknodes, commonrevs,
                                        source):
            yield chunk

        yield self.close()

        if clnodes:
            repo.hook('outgoing', node=hex(clnodes[0]), source=source)

    def generatemanifests(self, commonrevs, clrevorder, fastpathlinkrev, mfs,
                          mfchangedfiles, fnodes):
        """Yield the manifest chunks of the changegroup.

        mfs maps manifest node -> introducing changeset node and
        mfchangedfiles maps manifest node -> set of changed files; both are
        filled by the changelog pass. On the slow path (fastpathlinkrev
        false) fnodes is populated as a side effect while the manifest
        chunks are being generated, so it is only complete once this
        generator is exhausted.
        """
        repo = self._repo
        ml = repo.manifest
        # directory -> {treemanifest node -> linkrev changeset node}
        tmfnodes = {}

        # Callback for the manifest, used to collect linkrevs for filelog
        # revisions.
        # Returns the linkrev node (collected in lookupcl).
        if fastpathlinkrev:
            lookupmflinknode = mfs.__getitem__
        else:
            def lookupmflinknode(x):
                """Callback for looking up the linknode for manifests.

                Returns the linkrev node for the specified manifest.

                SIDE EFFECT:

                1) fclnodes gets populated with the list of relevant
                   file nodes if we're not using fastpathlinkrev
                2) When treemanifests are in use, collects treemanifest nodes
                   to send

                Note that this means manifests must be completely sent to
                the client before you can trust the list of files and
                treemanifests to send.
                """
                clnode = mfs[x]
                # We no longer actually care about reading deltas of
                # the manifest here, because we already know the list
                # of changed files, so for treemanifests (which
                # lazily-load anyway to *generate* a readdelta) we can
                # just load them with read() and then we'll actually
                # be able to correctly load node IDs from the
                # submanifest entries.
                if 'treemanifest' in repo.requirements:
                    mdata = ml.read(x)
                else:
                    mdata = ml.readfast(x)
                for f in mfchangedfiles[x]:
                    try:
                        n = mdata[f]
                    except KeyError:
                        continue
                    # record the first changeset introducing this filelog
                    # version
                    fclnodes = fnodes.setdefault(f, {})
                    fclnode = fclnodes.setdefault(n, clnode)
                    if clrevorder[clnode] < clrevorder[fclnode]:
                        fclnodes[n] = clnode
                # gather list of changed treemanifest nodes
                if 'treemanifest' in repo.requirements:
                    submfs = {'/': mdata}
                    for dn, bn in _moddirs(mfchangedfiles[x]):
                        try:
                            submf = submfs[dn]
                            submf = submf._dirs[bn]
                        except KeyError:
                            continue # deleted directory, so nothing to send
                        submfs[submf.dir()] = submf
                        tmfclnodes = tmfnodes.setdefault(submf.dir(), {})
                        tmfclnode = tmfclnodes.setdefault(submf._node, clnode)
                        if clrevorder[clnode] < clrevorder[tmfclnode]:
                            # Key by the directory manifest node. The file
                            # loop's 'n' is a stale file node here (or
                            # unbound when that loop assigned nothing).
                            tmfclnodes[submf._node] = clnode
                return clnode

        mfnodes = self.prune(ml, mfs, commonrevs)
        size = 0
        for x in self._packmanifests('', mfnodes, lookupmflinknode):
            size += len(x)
            yield x
        for dir, nodes in tmfnodes.iteritems():
            # drop directory manifests whose linkrev is already common
            prunednodes = self.prune(ml.dirlog(dir), nodes, commonrevs)
            for x in self._packmanifests(dir, prunednodes, nodes.get):
                size += len(x)
                yield x
        self._verbosenote(_('%8.i (manifests)\n') % size)
        yield self._manifestsdone()

    # The 'source' parameter is useful for extensions
    def generatefiles(self, changedfiles, linknodes, commonrevs, source):
        """Yield, per changed file, a file header followed by its delta group.

        linknodes(filerevlog, fname) must return a mapping of file node ->
        linkrev changeset node. Files with nothing left after pruning are
        skipped. Raises error.Abort when a file's revlog is empty or
        missing.
        """
        repo = self._repo
        progress = self._progress
        msgbundling = _('bundling')

        total = len(changedfiles)
        # for progress output
        msgfiles = _('files')
        for i, fname in enumerate(sorted(changedfiles)):
            filerevlog = repo.file(fname)
            if not filerevlog:
                raise error.Abort(_("empty or missing revlog for %s") % fname)

            linkrevnodes = linknodes(filerevlog, fname)
            # Lookup for filenodes, we collected the linkrev nodes above in the
            # fastpath case and with lookupmf in the slowpath case.
            def lookupfilelog(x):
                return linkrevnodes[x]

            filenodes = self.prune(filerevlog, linkrevnodes, commonrevs)
            if filenodes:
                progress(msgbundling, i + 1, item=fname, unit=msgfiles,
                         total=total)
                h = self.fileheader(fname)
                size = len(h)
                yield h
                for chunk in self.group(filenodes, filerevlog, lookupfilelog):
                    size += len(chunk)
                    yield chunk
                self._verbosenote(_('%8.i %s\n') % (size, fname))
        progress(msgbundling, None)

    def deltaparent(self, revlog, rev, p1, p2, prev):
        """Return the rev to delta against; here always the one sent before."""
        return prev

    def revchunk(self, revlog, rev, prev, linknode):
        """Yield the chunk header, delta header and delta for one revision."""
        node = revlog.node(rev)
        p1, p2 = revlog.parentrevs(rev)
        base = self.deltaparent(revlog, rev, p1, p2, prev)

        prefix = ''
        if revlog.iscensored(base) or revlog.iscensored(rev):
            # a censored side is sent as full text (or its tombstone),
            # prefixed by a diff header, instead of a computed delta
            try:
                delta = revlog.revision(node)
            except error.CensoredNodeError as e:
                delta = e.tombstone
            if base == nullrev:
                prefix = mdiff.trivialdiffheader(len(delta))
            else:
                baselen = revlog.rawsize(base)
                prefix = mdiff.replacediffheader(baselen, len(delta))
        elif base == nullrev:
            delta = revlog.revision(node)
            prefix = mdiff.trivialdiffheader(len(delta))
        else:
            delta = revlog.revdiff(base, rev)
        p1n, p2n = revlog.parents(node)
        basenode = revlog.node(base)
        flags = revlog.flags(rev)
        meta = self.builddeltaheader(node, p1n, p2n, basenode, linknode, flags)
        meta += prefix
        l = len(meta) + len(delta)
        yield chunkheader(l)
        yield meta
        yield delta
    def builddeltaheader(self, node, p1n, p2n, basenode, linknode, flags):
        """Pack the delta header; this format stores neither base nor flags."""
        # do nothing with basenode, it is implicitly the previous one in HG10
        # do nothing with flags, it is implicitly 0 for cg1 and cg2
        return struct.pack(self.deltaheader, node, p1n, p2n, linknode)

904

905

class cg2packer(cg1packer):
    """Packer for version '02' streams, whose headers name the delta base."""
    version = '02'
    deltaheader = _CHANGEGROUPV2_DELTA_HEADER

    def __init__(self, repo, bundlecaps=None):
        super(cg2packer, self).__init__(repo, bundlecaps)
        # Since generaldelta is directly supported by cg2, reordering
        # generally doesn't help, so we disable it by default (treating
        # bundle.reorder=auto just like bundle.reorder=False).
        if self._reorder is None:
            self._reorder = False

    def deltaparent(self, revlog, rev, p1, p2, prev):
        """Return the revlog's own delta parent when it is usable, else prev."""
        candidate = revlog.deltaparent(rev)
        # Reuse the stored delta parent only when it is a real revision
        # (not a full snapshot) that the remote is sure to have: one of
        # the parents or the revision sent just before.
        if candidate != nullrev and candidate in (p1, p2, prev):
            return candidate
        return prev

    def builddeltaheader(self, node, p1n, p2n, basenode, linknode, flags):
        """Pack the five-node cg2 delta header."""
        # Do nothing with flags, it is implicitly 0 in cg1 and cg2
        fields = (node, p1n, p2n, basenode, linknode)
        return struct.pack(self.deltaheader, *fields)

928

929

class cg3packer(cg2packer):
    """Packer for version '03' streams (flags in header, dir manifests)."""
    version = '03'
    deltaheader = _CHANGEGROUPV3_DELTA_HEADER

    def _packmanifests(self, dir, mfnodes, lookuplinknode):
        """Yield the chunks for one manifest log.

        A non-empty dir gets a file header in front of its group; the
        root manifest (empty dir) does not.
        """
        if dir:
            yield self.fileheader(dir)
        dirlog = self._repo.manifest.dirlog(dir)
        chunks = self.group(mfnodes, dirlog, lookuplinknode,
                            units=_('manifests'))
        for chunk in chunks:
            yield chunk

    def _manifestsdone(self):
        """Return the closing chunk that ends the manifest section."""
        return self.close()

    def builddeltaheader(self, node, p1n, p2n, basenode, linknode, flags):
        """Pack the cg3 delta header, which also carries the flags."""
        fields = (node, p1n, p2n, basenode, linknode, flags)
        return struct.pack(self.deltaheader, *fields)

946

947

# Maps a changegroup version string to its (packer, unpacker) classes.
_packermap = {'01': (cg1packer, cg1unpacker),
             # cg2 adds support for exchanging generaldelta
             '02': (cg2packer, cg2unpacker),
             # cg3 adds support for exchanging revlog flags and treemanifests
             '03': (cg3packer, cg3unpacker),
}

def allsupportedversions(ui):
    """Return the set of changegroup versions enabled by ``ui``'s config.

    Starts from every version in ``_packermap``; '03' is kept only when
    ``experimental.changegroup3`` or ``experimental.treemanifest`` is set.
    """
    versions = set(_packermap.keys())
    versions.discard('03')
    if (ui.configbool('experimental', 'changegroup3') or
        ui.configbool('experimental', 'treemanifest')):
        versions.add('03')
    return versions

# Changegroup versions that can be applied to the repo
def supportedincomingversions(repo):
    """Return the set of changegroup versions ``repo`` can receive.

    This is ``allsupportedversions(repo.ui)`` plus '03' whenever the
    repository has the 'treemanifest' requirement.
    """
    versions = allsupportedversions(repo.ui)
    if 'treemanifest' in repo.requirements:
        versions.add('03')
    return versions

# Changegroup versions that can be created from the repo
def supportedoutgoingversions(repo):
    """Return the set of changegroup versions ``repo`` can produce.

    For a repository with the 'treemanifest' requirement only '03' is
    offered (in addition to anything else left in the set); otherwise
    the result is ``allsupportedversions(repo.ui)``.
    """
    versions = allsupportedversions(repo.ui)
    if 'treemanifest' in repo.requirements:
        # Versions 01 and 02 support only flat manifests and it's just too
        # expensive to convert between the flat manifest and tree manifest on
        # the fly. Since tree manifests are hashed differently, all of history
        # would have to be converted. Instead, we simply don't even pretend to
        # support versions 01 and 02.
        versions.discard('01')
        versions.discard('02')
        versions.add('03')
    return versions

def safeversion(repo):
    """Return the smallest outgoing version safe to assume for clients.

    '01' is excluded for repositories with the 'generaldelta'
    requirement; the minimum of the remaining versions is returned.
    """
    # Finds the smallest version that it's safe to assume clients of the repo
    # will support. For example, all hg versions that support generaldelta also
    # support changegroup 02.
    versions = supportedoutgoingversions(repo)
    if 'generaldelta' in repo.requirements:
        versions.discard('01')
    assert versions
    return min(versions)

def getbundler(version, repo, bundlecaps=None):
    """Instantiate the packer registered for ``version``.

    ``version`` must be one of ``supportedoutgoingversions(repo)``; the
    packer class from ``_packermap`` is called with (repo, bundlecaps).
    """
    assert version in supportedoutgoingversions(repo)
    return _packermap[version][0](repo, bundlecaps)

def getunbundler(version, fh, alg):
    """Instantiate the unpacker registered for ``version``.

    The unpacker class from ``_packermap`` is called with (fh, alg).
    Raises KeyError if ``version`` is not a key of ``_packermap``.
    """
    return _packermap[version][1](fh, alg)

def _changegroupinfo(repo, nodes, source):
    """Report the changesets about to be bundled through ``repo.ui``.

    The count is printed in verbose mode or when ``source`` is 'bundle';
    the hex form of each node is additionally written in debug mode.
    """
    if repo.ui.verbose or source == 'bundle':
        repo.ui.status(_("%d changesets found\n") % len(nodes))
    if repo.ui.debugflag:
        repo.ui.debug("list of changesets:\n")
        for node in nodes:
            repo.ui.debug("%s\n" % hex(node))

def getsubsetraw(repo, outgoing, bundler, source, fastpath=False):
    """Return what ``bundler.generate`` produces for ``outgoing``.

    Operates on the unfiltered repo, runs the 'preoutgoing' hook with
    ``throw=True``, reports the changesets via ``_changegroupinfo`` and
    then delegates to ``bundler.generate``.

    Note that ``outgoing.missingheads`` is sorted in place.
    """
    repo = repo.unfiltered()
    commonrevs = outgoing.common
    csets = outgoing.missing
    heads = outgoing.missingheads
    # We go through the fast path if we get told to, or if all (unfiltered)
    # heads have been requested (since we then know that all linkrevs will
    # be pulled by the client).
    heads.sort()
    fastpathlinkrev = fastpath or (
        repo.filtername is None and heads == sorted(repo.heads()))

    repo.hook('preoutgoing', throw=True, source=source)
    _changegroupinfo(repo, csets, source)
    return bundler.generate(commonrevs, csets, fastpathlinkrev, source)

def getsubset(repo, outgoing, bundler, source, fastpath=False):
    """Return an unbundler over the changegroup for ``outgoing``.

    The raw chunks from ``getsubsetraw`` are wrapped in a
    ``util.chunkbuffer`` and handed to the unpacker matching
    ``bundler.version``, with no compression algorithm (``None``).
    """
    gengroup = getsubsetraw(repo, outgoing, bundler, source, fastpath)
    return getunbundler(bundler.version, util.chunkbuffer(gengroup), None)

def changegroupsubset(repo, roots, heads, source, version='01'):
    """Compute a changegroup consisting of all the nodes that are
    descendants of any of the roots and ancestors of any of the heads.
    Return the result of getsubset(): an unbundler reading successive
    changegroup chunks from a chunkbuffer.

    It is fairly complex as determining which filenodes and which
    manifest nodes need to be included for the changeset to be complete
    is non-trivial.

    Another wrinkle is doing the reverse, figuring out which changeset in
    the changegroup a particular filenode or manifestnode belongs to.
    """
    cl = repo.changelog
    if not roots:
        roots = [nullid]
    # The non-null parents of the roots serve as discovery bases, except
    # for those that end up inside the selected set themselves.
    discbases = []
    for n in roots:
        discbases.extend([p for p in cl.parents(n) if p != nullid])
    # TODO: remove call to nodesbetween.
    csets, roots, heads = cl.nodesbetween(roots, heads)
    included = set(csets)
    discbases = [n for n in discbases if n not in included]
    outgoing = discovery.outgoing(cl, discbases, heads)
    bundler = getbundler(version, repo)
    return getsubset(repo, outgoing, bundler, source)

def getlocalchangegroupraw(repo, source, outgoing, bundlecaps=None,
                           version='01'):
    """Like getbundle, but taking a discovery.outgoing as an argument.

    This is only implemented for local repos and reuses potentially
    precomputed sets in outgoing. Returns a raw changegroup generator,
    or None when ``outgoing.missing`` is empty."""
    if not outgoing.missing:
        return None
    bundler = getbundler(version, repo, bundlecaps)
    return getsubsetraw(repo, outgoing, bundler, source)

def getlocalchangegroup(repo, source, outgoing, bundlecaps=None,
                        version='01'):
    """Like getbundle, but taking a discovery.outgoing as an argument.

    This is only implemented for local repos and reuses potentially
    precomputed sets in outgoing. Returns the result of getsubset(),
    or None when ``outgoing.missing`` is empty."""
    if not outgoing.missing:
        return None
    bundler = getbundler(version, repo, bundlecaps)
    return getsubset(repo, outgoing, bundler, source)

def computeoutgoing(repo, heads, common):
    """Computes which revs are outgoing given a set of common
    and a set of heads.

    This is a separate function so extensions can have access to
    the logic.

    Nodes in ``common`` that the changelog does not have are dropped;
    an empty ``common`` becomes ``[nullid]`` and an empty ``heads``
    becomes the changelog heads.

    Returns a discovery.outgoing object.
    """
    cl = repo.changelog
    if common:
        hasnode = cl.hasnode
        common = [n for n in common if hasnode(n)]
    else:
        common = [nullid]
    if not heads:
        heads = cl.heads()
    return discovery.outgoing(cl, common, heads)

def getchangegroup(repo, source, heads=None, common=None, bundlecaps=None,
                   version='01'):
    """Like changegroupsubset, but returns the set difference between the
    ancestors of heads and the ancestors common.

    If heads is None, use the local heads. If common is None, use [nullid].

    The nodes in common might not all be known locally due to the way the
    current discovery protocol works.
    """
    outgoing = computeoutgoing(repo, heads, common)
    return getlocalchangegroup(repo, source, outgoing, bundlecaps=bundlecaps,
                               version=version)

def changegroup(repo, basenodes, source):
    """Return a changegroup from ``basenodes`` up to the current heads."""
    # to avoid a race we use changegroupsubset() (issue1320)
    return changegroupsubset(repo, basenodes, repo.heads(), source)

def _addchangegroupfiles(repo, source, revmap, trp, pr, needfiles):
    """Add the file revision groups read from ``source`` to ``repo``.

    Reads filelog headers from ``source`` until an empty one is found,
    adding each group to the matching filelog. ``pr`` is called once per
    file. ``needfiles`` maps a filename to the nodes expected for it;
    received nodes are removed from it (the mapping is mutated), and any
    node still listed afterwards must already exist in the filelog.

    Returns a ``(revisions, files)`` tuple with the number of revisions
    added and the number of file groups processed.

    Raises error.Abort for an empty group, a censored delta base, an
    unexpected node for a file listed in ``needfiles``, or missing data.
    """
    revisions = 0
    files = 0
    while True:
        chunkdata = source.filelogheader()
        if not chunkdata:
            break
        f = chunkdata["filename"]
        repo.ui.debug("adding %s revisions\n" % f)
        pr()
        fl = repo.file(f)
        o = len(fl)  # revision count before adding, to measure growth
        try:
            if not fl.addgroup(source, revmap, trp):
                raise error.Abort(_("received file revlog group is empty"))
        except error.CensoredBaseError as e:
            raise error.Abort(_("received delta base is censored: %s") % e)
        revisions += len(fl) - o
        files += 1
        if f in needfiles:
            needs = needfiles[f]
            # every newly added revision must be one we were waiting for
            for new in xrange(o, len(fl)):
                n = fl.node(new)
                if n in needs:
                    needs.remove(n)
                else:
                    raise error.Abort(
                        _("received spurious file revlog entry"))
            if not needs:
                del needfiles[f]
    repo.ui.progress(_('files'), None)

    # whatever is still needed has to be present locally already
    for f, needs in needfiles.iteritems():
        fl = repo.file(f)
        for n in needs:
            try:
                fl.rev(n)
            except error.LookupError:
                raise error.Abort(
                    _('missing file data for %s:%s - run hg verify') %
                    (f, hex(n)))

    return revisions, files

	Site-wide shortcuts
/	Use quick search box
g h	Goto home page
g g	Goto my private gists page
g G	Goto my public gists page
g 0-9	Goto bookmarked items from 0-9
n r	New repository page
n g	New gist page

	Repositories
g s	Goto summary page
g c	Goto changelog page
g f	Goto files page
g F	Goto files page with file search activated
g p	Goto pull requests page
g o	Goto repository settings
g O	Goto repository access permissions settings
t s	Toggle sidebar on some pages

             # changegroup.py - Mercurial changegroup manipulation functions
             #
             #  Copyright 2006 Matt Mackall <mpm@selenic.com>
             #
             # This software may be used and distributed according to the terms of the
             # GNU General Public License version 2 or any later version.
             from __future__ import absolute_import
             import os
             import struct
             import tempfile
             import weakref
             from .i18n import _
             from .node import (
                 hex,
                 nullid,
                 nullrev,
                 short,
             )
             from . import (
                 branchmap,
                 dagutil,
                 discovery,
                 error,
                 mdiff,
                 phases,
                 util,
             )
             _CHANGEGROUPV1_DELTA_HEADER = "20s20s20s20s"
             _CHANGEGROUPV2_DELTA_HEADER = "20s20s20s20s20s"
             _CHANGEGROUPV3_DELTA_HEADER = ">20s20s20s20s20sH"
             def readexactly(stream, n):
                 '''read n bytes from stream.read and abort if less was available

                 Returns the data read; raises error.Abort when the stream yields
                 fewer than n bytes.
                 '''
                 data = stream.read(n)
                 got = len(data)
                 if got >= n:
                     return data
                 raise error.Abort(_("stream ended unexpectedly"
                                    " (got %d bytes, expected %d)")
                                   % (got, n))
             def getchunk(stream):
                 """return the next chunk from stream as a string

                 The chunk starts with a big-endian signed 32-bit length that
                 includes its own 4 bytes. A length of 0 yields "", lengths 1-4
                 and negative lengths abort, anything larger returns the payload.
                 """
                 (length,) = struct.unpack(">l", readexactly(stream, 4))
                 if length > 4:
                     return readexactly(stream, length - 4)
                 if length:
                     raise error.Abort(_("invalid chunk length %d") % length)
                 return ""
             def chunkheader(length):
                 """return a changegroup chunk header (string)

                 The header is ``length + 4`` packed as a big-endian signed
                 32-bit integer.
                 """
                 total = 4 + length
                 return struct.pack(">l", total)
             def closechunk():
                 """return a changegroup chunk header (string) for a zero-length chunk

                 This is the value 0 packed as a big-endian signed 32-bit integer.
                 """
                 return struct.pack(">l", 0)
             def combineresults(results):
                 """logic to combine 0 or more addchangegroup results into one

                 Results above 1 or below -1 contribute their head-count change
                 (``ret - 1`` / ``ret + 1``). Iteration stops at the first 0.
                 Returns ``1 + delta`` for a positive accumulated delta,
                 ``-1 + delta`` for a negative one, otherwise 0 if a 0 result was
                 seen and 1 if not.
                 """
                 headdelta = 0
                 combined = 1
                 for ret in results:
                     # If any changegroup result is 0, stop looking further.
                     # NOTE(review): a non-zero head delta accumulated before the 0
                     # still wins below, so the final result is not always 0 --
                     # confirm whether that is intended.
                     if ret == 0:
                         combined = 0
                         break
                     if ret < -1:
                         headdelta += ret + 1
                     elif ret > 1:
                         headdelta += ret - 1
                 if headdelta > 0:
                     return 1 + headdelta
                 if headdelta < 0:
                     return -1 + headdelta
                 return combined
             # Maps a bundle type name to a (header, compression) pair; the
             # compression value is looked up in util.compressors by writebundle().
             bundletypes = {
                 # only when using unbundle on ssh and old http servers
                 # since the unification ssh accepts a header but there
                 # is no capability signaling it.
                 "": ("", None),
                 # special-cased below
                 "HG20": (),
                 "HG10UN": ("HG10UN", None),
                 "HG10BZ": ("HG10", 'BZ'),
                 "HG10GZ": ("HG10GZ", 'GZ'),
             }

             # hgweb uses this list to communicate its preferred type
             bundlepriority = ['HG10GZ', 'HG10BZ', 'HG10UN']
             def writechunks(ui, chunks, filename, vfs=None):
                 """Write chunks to a file and return its filename.

                 The stream is assumed to be a bundle file.
                 If no filename is specified, a temporary file is created.
                 A named file is opened through ``vfs`` when one is given, otherwise
                 with the builtin open(). If writing fails, the file is removed
                 again before the exception propagates.

                 NOTE(review): the file is opened in "wb" mode, which for the
                 builtin open() truncates an existing file -- confirm whether
                 callers guarantee the file does not exist. ``ui`` is unused here.
                 """
                 fh = None
                 cleanup = None
                 try:
                     if not filename:
                         fd, filename = tempfile.mkstemp(prefix="hg-bundle-",
                                                         suffix=".hg")
                         fh = os.fdopen(fd, "wb")
                     elif vfs:
                         fh = vfs.open(filename, "wb")
                     else:
                         fh = open(filename, "wb")
                     # from here on a failure must remove the partial file
                     cleanup = filename
                     for piece in chunks:
                         fh.write(piece)
                     cleanup = None
                     return filename
                 finally:
                     if fh is not None:
                         fh.close()
                     if cleanup is not None:
                         if filename and vfs:
                             vfs.unlink(cleanup)
                         else:
                             os.unlink(cleanup)
             def writebundle(ui, cg, filename, bundletype, vfs=None, compression=None):
                 """Write a bundle file and return its filename.

                 If no filename is specified, a temporary file is created.
                 The bundle file will be deleted in case of errors.

                 For bundletype "HG20" the changegroup is wrapped in a bundle2
                 'changegroup' part and ``compression`` is passed to the bundle.
                 For every other type ``compression`` must be None, ``cg`` must be
                 a version '01' changegroup, and the output is the type's header
                 followed by the chunks run through the matching compressor.
                 """
                 if bundletype == "HG20":
                     from . import bundle2
                     bundle = bundle2.bundle20(ui)
                     bundle.setcompression(compression)
                     part = bundle.newpart('changegroup', data=cg.getchunks())
                     part.addparam('version', cg.version)
                     return writechunks(ui, bundle.getchunks(), filename, vfs=vfs)

                 # compression argument is only for the bundle2 case
                 assert compression is None
                 if cg.version != '01':
                     raise error.Abort(_('old bundle types only supports v1 '
                                         'changegroups'))
                 header, comp = bundletypes[bundletype]
                 if comp not in util.compressors:
                     raise error.Abort(_('unknown stream compression type: %s')
                                       % comp)
                 compressor = util.compressors[comp]()
                 rawchunks = cg.getchunks()

                 def _compressed():
                     # header first, then each chunk compressed, then the tail
                     yield header
                     for chunk in rawchunks:
                         yield compressor.compress(chunk)
                     yield compressor.flush()

                 return writechunks(ui, _compressed(), filename, vfs=vfs)
             class cg1unpacker(object):
                 """Unpacker for cg1 changegroup streams.
                 A changegroup unpacker handles the framing of the revision data in
                 the wire format. Most consumers will want to use the apply()
                 method to add the changes from the changegroup to a repository.
                 If you're forwarding a changegroup unmodified to another consumer,
                 use getchunks(), which returns an iterator of changegroup
                 chunks. This is mostly useful for cases where you need to know the
                 data stream has ended by observing the end of the changegroup.
                 deltachunk() is useful only if you're applying delta data. Most
                 consumers should prefer apply() instead.
                 A few other public methods exist. Those are used only for
                 bundlerepo and some debug commands - their use is discouraged.
                 """
                 deltaheader = _CHANGEGROUPV1_DELTA_HEADER
                 deltaheadersize = struct.calcsize(deltaheader)
                 version = '01'
                 _grouplistcount = 1 # One list of files after the manifests
                 def __init__(self, fh, alg):
                     """Wrap ``fh`` in the decompressor selected by ``alg``.

                     'UN' is treated as None and 'BZ' is mapped to the
                     '_truncatedBZ' decompressor. Raises error.Abort when ``alg``
                     is not a key of util.decompressors.
                     """
                     if alg == 'UN':
                         alg = None # get more modern without breaking too much
                     if alg not in util.decompressors:
                         raise error.Abort(_('unknown stream compression type: %s')
                                          % alg)
                     if alg == 'BZ':
                         alg = '_truncatedBZ'
                     self._stream = util.decompressors[alg](fh)
                     self._type = alg
                     # optional zero-argument hook, called by _chunklength()
                     self.callback = None
                 # These methods (compressed, read, seek, tell) all appear to only
                 # be used by bundlerepo, but it's a little hard to tell.
                 def compressed(self):
                     """Return True when ``self._type`` is not None."""
                     return self._type is not None
                 def read(self, l):
                     """Return the result of reading ``l`` from the wrapped stream."""
                     return self._stream.read(l)
                 def seek(self, pos):
                     """Delegate ``seek(pos)`` to the wrapped stream."""
                     return self._stream.seek(pos)
                 def tell(self):
                     """Delegate ``tell()`` to the wrapped stream."""
                     return self._stream.tell()
                 def close(self):
                     """Close the wrapped stream and return its result."""
                     return self._stream.close()
                 def _chunklength(self):
                     """Read a chunk length prefix and return the payload size.

                     Returns 0 for a zero length prefix, aborts on prefixes of
                     1-4 or below zero, and otherwise invokes ``self.callback``
                     (if set) before returning the length minus the 4 prefix bytes.
                     """
                     (length,) = struct.unpack(">l", readexactly(self._stream, 4))
                     if length > 4:
                         if self.callback:
                             self.callback()
                         return length - 4
                     if length:
                         raise error.Abort(_("invalid chunk length %d") % length)
                     return 0
                 def changelogheader(self):
                     """v10 does not have a changelog header chunk

                     Always returns an empty dict and reads nothing.
                     """
                     return {}
                 def manifestheader(self):
                     """v10 does not have a manifest header chunk

                     Always returns an empty dict and reads nothing.
                     """
                     return {}
                 def filelogheader(self):
                     """return the header of the filelogs chunk, v10 only has the filename

                     Returns ``{'filename': name}``, or an empty dict when the
                     chunk length is zero.
                     """
                     namelen = self._chunklength()
                     if namelen:
                         return {'filename': readexactly(self._stream, namelen)}
                     return {}
                 def _deltaheader(self, headertuple, prevnode):
                     node, p1, p2, cs = headertuple
                     if prevnode is None:
                         deltabase = p1
                     else:
                         deltabase = prevnode
                     flags = 0
                     return node, p1, p2, deltabase, cs, flags
                 def deltachunk(self, prevnode):
                     """Read one delta chunk and return it as a dict.

                     Returns an empty dict when the chunk length is zero. Otherwise
                     the dict has the keys 'node', 'p1', 'p2', 'cs', 'deltabase',
                     'delta' and 'flags'; the header fields are interpreted by
                     ``self._deltaheader`` with ``prevnode``.
                     """
                     length = self._chunklength()
                     if not length:
                         return {}
                     hsize = self.deltaheadersize
                     fields = struct.unpack(self.deltaheader,
                                            readexactly(self._stream, hsize))
                     # whatever follows the fixed-size header is the delta itself
                     delta = readexactly(self._stream, length - hsize)
                     node, p1, p2, deltabase, cs, flags = self._deltaheader(fields,
                                                                            prevnode)
                     return {'node': node, 'p1': p1, 'p2': p2, 'cs': cs,
                             'deltabase': deltabase, 'delta': delta, 'flags': flags}
                 def getchunks(self):
                     """Yield all the chunks contained in the bundle.

                     Used when you need to forward the binary stream to a file or
                     another network API. To do so, it parses the changegroup data;
                     otherwise it would block in the case of sshrepo because it
                     doesn't know where the stream ends.

                     Each chunk is yielded as its header followed by the payload in
                     slices of at most 2**20 bytes; a close chunk is yielded at the
                     end of every group.
                     """
                     # an empty chunkgroup is the end of the changegroup
                     # a changegroup has at least 2 chunkgroups (changelog and manifest).
                     # after that, changegroup versions 1 and 2 have a series of groups
                     # with one group per file. changegroup 3 has a series of directory
                     # manifests before the files.
                     count = 0
                     emptycount = 0
                     # stop once _grouplistcount empty groups were seen after the
                     # first two groups
                     while emptycount < self._grouplistcount:
                         empty = True
                         count += 1
                         while True:
                             # self is passed as the stream: getchunk() uses its
                             # read() method
                             chunk = getchunk(self)
                             if not chunk:
                                 # end of the current group; only groups past the
                                 # first two count towards termination
                                 if empty and count > 2:
                                     emptycount += 1
                                 break
                             empty = False
                             yield chunkheader(len(chunk))
                             pos = 0
                             while pos < len(chunk):
                                 next = pos + 2**20
                                 yield chunk[pos:next]
                                 pos = next
                         yield closechunk()
                 def _unpackmanifests(self, repo, revmap, trp, prog, numchanges):
                     """Add the manifest group read from this stream to ``repo``.

                     ``prog`` is called with the 'manifests' label and
                     ``numchanges`` to build the callback installed on
                     ``self.callback`` while the group is added; the 'manifests'
                     progress is cleared afterwards.
                     """
                     # We know that we'll never have more manifests than we had
                     # changesets.
                     self.callback = prog(_('manifests'), numchanges)
                     # no need to check for empty manifest group here:
                     # if the result of the merge of 1 and 2 is the same in 3 and 4,
                     # no new manifest will be created and the manifest group will
                     # be empty during the pull
                     self.manifestheader()
                     repo.manifest.addgroup(self, revmap, trp)
                     repo.ui.progress(_('manifests'), None)
                 def apply(self, repo, srctype, url, emptyok=False,
                           targetphase=phases.draft, expectedtotal=None):
                     """Add the changegroup returned by source.read() to this repo.
                     srctype is a string like 'push', 'pull', or 'unbundle'.  url is
                     the URL of the repo where this changegroup is coming from.
                     emptyok: when false (the default), an empty changelog group
                     aborts with "received changelog group is empty".
                     targetphase: phase passed to phases.retractboundary() for the
                     added changesets when srctype is neither 'push', 'serve' nor
                     'strip'.
                     expectedtotal: used as the total for changeset progress output.
                     Everything runs inside a single repo.transaction(); the
                     'prechangegroup' and 'pretxnchangegroup' hooks are run with
                     throw=True, and the 'changegroup'/'incoming' hooks are scheduled
                     through repo._afterlock() once the transaction closes.
                     Return an integer summarizing the change to this repo:
                     - nothing changed or no source: 0
                     - more heads than before: 1+added heads (2..n)
                     - fewer heads than before: -1-removed heads (-2..-n)
                     - number of heads stays the same: 1
                     NOTE(review): the final return statement of this implementation
                     never yields 0 (it returns dh - 1 for negative dh and dh + 1
                     otherwise), so the "0" case above is not produced here.
                     """
                     repo = repo.unfiltered()
                     # Callback handed to cl.addgroup() for the changelog group: logs
                     # the incoming node and returns the current changelog length.
                     # 'cl' is bound later, inside the transaction.
                     def csmap(x):
                         repo.ui.debug("add changeset %s\n" % short(x))
                         return len(cl)
                     # Maps a changeset node to its revision number; handed to the
                     # manifest and file unpacking steps below.
                     def revmap(x):
                         return cl.rev(x)
                     changesets = files = revisions = 0
                     try:
                         # the transaction name is the source type and the
                         # password-stripped URL joined by a newline
                         with repo.transaction("\n".join([srctype,
                                                          util.hidepassword(url)])) as tr:
                             # The transaction could have been created before and already
                             # carries source information. In this case we use the top
                             # level data. We overwrite the argument because we need to use
                             # the top level value (if they exist) in this function.
                             srctype = tr.hookargs.setdefault('source', srctype)
                             url = tr.hookargs.setdefault('url', url)
                             repo.hook('prechangegroup', throw=True, **tr.hookargs)
                             # write changelog data to temp files so concurrent readers
                             # will not see an inconsistent view
                             cl = repo.changelog
                             cl.delayupdate(tr)
                             # heads before anything is added; used for the head delta
                             # and for the "new heads" log line in runhooks()
                             oldheads = cl.heads()
                             # the revlogs receive a weak proxy to the transaction
                             trp = weakref.proxy(tr)
                             # pull off the changeset group
                             repo.ui.status(_("adding changesets\n"))
                             clstart = len(cl)
                             # Callable progress reporter: every call reports the
                             # current count for 'step' (out of 'total') and then
                             # increments the count. Instances are installed as
                             # self.callback or passed to _addchangegroupfiles().
                             class prog(object):
                                 def __init__(self, step, total):
                                     self._step = step
                                     self._total = total
                                     self._count = 1
                                 def __call__(self):
                                     repo.ui.progress(self._step, self._count,
                                                      unit=_('chunks'), total=self._total)
                                     self._count += 1
                             self.callback = prog(_('changesets'), expectedtotal)
                             # collects field 3 of every added changelog entry (the
                             # same field the packer treats as the list of changed
                             # files)
                             efiles = set()
                             def onchangelog(cl, node):
                                 efiles.update(cl.read(node)[3])
                             self.changelogheader()
                             srccontent = cl.addgroup(self, csmap, trp,
                                                      addrevisioncb=onchangelog)
                             # from here on efiles is only a count; it becomes the
                             # total for the 'files' progress below
                             efiles = len(efiles)
                             if not (srccontent or emptyok):
                                 raise error.Abort(_("received changelog group is empty"))
                             clend = len(cl)
                             # number of changelog revisions actually added
                             changesets = clend - clstart
                             repo.ui.progress(_('changesets'), None)
                             # pull off the manifest group
                             repo.ui.status(_("adding manifests\n"))
                             self._unpackmanifests(repo, revmap, trp, prog, changesets)
                             # filename -> set of file nodes; only populated when
                             # server.validate is enabled, then handed to
                             # _addchangegroupfiles()
                             needfiles = {}
                             if repo.ui.configbool('server', 'validate', default=False):
                                 # validate incoming csets have their manifests
                                 for cset in xrange(clstart, clend):
                                     mfnode = repo.changelog.read(
                                         repo.changelog.node(cset))[0]
                                     mfest = repo.manifest.readdelta(mfnode)
                                     # store file nodes we must see
                                     for f, n in mfest.iteritems():
                                         needfiles.setdefault(f, set()).add(n)
                             # process the files
                             repo.ui.status(_("adding file changes\n"))
                             # the per-chunk callback is cleared; file progress is
                             # driven through 'pr' instead
                             self.callback = None
                             pr = prog(_('files'), efiles)
                             newrevs, newfiles = _addchangegroupfiles(
                                 repo, self, revmap, trp, pr, needfiles)
                             revisions += newrevs
                             files += newfiles
                             # dh is the change in the number of heads; a new head
                             # that closes its branch is not counted. It stays 0
                             # when there were no heads beforehand.
                             dh = 0
                             if oldheads:
                                 heads = cl.heads()
                                 dh = len(heads) - len(oldheads)
                                 for h in heads:
                                     if h not in oldheads and repo[h].closesbranch():
                                         dh -= 1
                             htext = ""
                             if dh:
                                 htext = _(" (%+d heads)") % dh
                             repo.ui.status(_("added %d changesets"
                                              " with %d changes to %d files%s\n")
                                              % (changesets, revisions, files, htext))
                             repo.invalidatevolatilesets()
                             if changesets > 0:
                                 # The first changegroup applied in a transaction
                                 # records its node range on the transaction itself;
                                 # otherwise the range only goes into this call's
                                 # private copy of the hook arguments.
                                 if 'node' not in tr.hookargs:
                                     tr.hookargs['node'] = hex(cl.node(clstart))
                                     tr.hookargs['node_last'] = hex(cl.node(clend - 1))
                                     hookargs = dict(tr.hookargs)
                                 else:
                                     hookargs = dict(tr.hookargs)
                                     hookargs['node'] = hex(cl.node(clstart))
                                     hookargs['node_last'] = hex(cl.node(clend - 1))
                                 repo.hook('pretxnchangegroup', throw=True, **hookargs)
                             # nodes of the changelog revisions added by this call
                             added = [cl.node(r) for r in xrange(clstart, clend)]
                             publishing = repo.publishing()
                             if srctype in ('push', 'serve'):
                                 # Old servers can not push the boundary themselves.
                                 # New servers won't push the boundary if changeset already
                                 # exists locally as secret
                                 #
                                 # We should not use added here but the list of all change in
                                 # the bundle
                                 if publishing:
                                     phases.advanceboundary(repo, tr, phases.public,
                                                            srccontent)
                                 else:
                                     # Those changesets have been pushed from the
                                     # outside, their phases are going to be pushed
                                     # alongside. Therefore `targetphase` is
                                     # ignored.
                                     phases.advanceboundary(repo, tr, phases.draft,
                                                            srccontent)
                                     phases.retractboundary(repo, tr, phases.draft, added)
                             elif srctype != 'strip':
                                 # publishing only alter behavior during push
                                 #
                                 # strip should not touch boundary at all
                                 phases.retractboundary(repo, tr, targetphase, added)
                             if changesets > 0:
                                 if srctype != 'strip':
                                     # During strip, branchcache is invalid but
                                     # coming call to `destroyed` will repair it.
                                     # In other case we can safely update cache on
                                     # disk.
                                     branchmap.updatecache(repo.filtered('served'))
                                 def runhooks():
                                     # These hooks run when the lock releases, not when the
                                     # transaction closes. So it's possible for the changelog
                                     # to have changed since we last saw it.
                                     if clstart >= len(repo):
                                         return
                                     # forcefully update the on-disk branch cache
                                     # NOTE(review): nothing in this closure updates the
                                     # cache; only the debug message below is emitted.
                                     repo.ui.debug("updating the branch cache\n")
                                     repo.hook("changegroup", **hookargs)
                                     # 'incoming' runs once per added node, with 'node'
                                     # replaced and 'node_last' removed
                                     for n in added:
                                         args = hookargs.copy()
                                         args['node'] = hex(n)
                                         del args['node_last']
                                         repo.hook("incoming", **args)
                                     newheads = [h for h in repo.heads()
                                                 if h not in oldheads]
                                     repo.ui.log("incoming",
                                                 "%s incoming changes - new heads: %s\n",
                                                 len(added),
                                                 ', '.join([hex(c[:6]) for c in newheads]))
                                 # the post-close callback name embeds clstart
                                 # zero-padded to 20 digits
                                 tr.addpostclose('changegroup-runhooks-%020i' % clstart,
                                                 lambda tr: repo._afterlock(runhooks))
                     finally:
                         repo.ui.flush()
                     # never return 0 here:
                     # a negative head delta maps to -2..-n, anything else to 1..n
                     if dh < 0:
                         return dh - 1
                     else:
                         return dh + 1
             class cg2unpacker(cg1unpacker):
                 """Unpacker for version '02' changegroup streams.
                 cg2 adds generaldelta support, which means every delta header
                 carries an explicit delta base node. Apart from that header layout
                 the stream is handled exactly like cg1.
                 """
                 version = '02'
                 deltaheader = _CHANGEGROUPV2_DELTA_HEADER
                 deltaheadersize = struct.calcsize(deltaheader)
                 def _deltaheader(self, headertuple, prevnode):
                     """Expand a 5-field cg2 header into the common 6-field form.
                     prevnode is unused because the delta base is part of the header;
                     the flags field does not exist in cg2 and is reported as 0.
                     """
                     node, parent1, parent2, base, linknode = headertuple
                     return node, parent1, parent2, base, linknode, 0
             class cg3unpacker(cg2unpacker):
                 """Unpacker for version '03' changegroup streams.
                 cg3 adds exchange of treemanifests and of revlog flags: the delta
                 header gains a flags field, and an empty chunk separates the
                 manifests from the files.
                 """
                 version = '03'
                 deltaheader = _CHANGEGROUPV3_DELTA_HEADER
                 deltaheadersize = struct.calcsize(deltaheader)
                 _grouplistcount = 2 # One list of manifests and one list of files
                 def _deltaheader(self, headertuple, prevnode):
                     """Return the 6-field cg3 header unchanged (prevnode is unused)."""
                     node, parent1, parent2, base, linknode, revflags = headertuple
                     return node, parent1, parent2, base, linknode, revflags
                 def _unpackmanifests(self, repo, revmap, trp, prog, numchanges):
                     """Read the root manifest group, then any directory manifest groups.
                     Directory groups are read until filelogheader() returns an empty
                     result. Raises error.Abort when a directory group adds nothing.
                     """
                     parent = super(cg3unpacker, self)
                     parent._unpackmanifests(repo, revmap, trp, prog, numchanges)
                     header = self.filelogheader()
                     while header:
                         # A non-empty header here means the changegroup carries
                         # directory manifests.
                         dirname = header["filename"]
                         repo.ui.debug("adding %s revisions\n" % dirname)
                         dirrevlog = repo.manifest.dirlog(dirname)
                         added = dirrevlog.addgroup(self, revmap, trp)
                         if not added:
                             raise error.Abort(_("received dir revlog group is empty"))
                         header = self.filelogheader()
             class headerlessfixup(object):
                 """File-like wrapper that replays already-consumed header bytes.
                 read() serves bytes from the saved header h first and only then
                 falls through to exact reads on the underlying file object fh.
                 """
                 def __init__(self, fh, h):
                     self._fh = fh
                     self._h = h
                 def read(self, n):
                     """Return exactly n bytes, draining the saved header first."""
                     pending = self._h
                     if not pending:
                         return readexactly(self._fh, n)
                     head = pending[:n]
                     self._h = pending[n:]
                     shortfall = n - len(head)
                     if shortfall > 0:
                         # the saved header ran out; take the rest from the stream
                         head += readexactly(self._fh, shortfall)
                     return head
             def _moddirs(files):
                 """Given a set of modified files, find the list of modified directories.
                 This returns a list of (path to changed dir, changed dir) tuples,
                 as that's what the one client needs anyway.
                 >>> _moddirs(['a/b/c.py', 'a/b/c.txt', 'a/d/e/f/g.txt', 'i.txt', ])
                 [('/', 'a/'), ('a/', 'b/'), ('a/', 'd/'), ('a/d/', 'e/'), ('a/d/e/', 'f/')]
                 """
                 alldirs = set()
                 for f in files:
                     path = f.split('/')[:-1]
                     for i in xrange(len(path) - 1, -1, -1):
                         dn = '/'.join(path[:i])
                         current = dn + '/', path[i] + '/'
                         if current in alldirs:
                             break
                         alldirs.add(current)
                 return sorted(alldirs)
             class cg1packer(object):
                 """Packer producing version '01' changegroup streams.
                 generate() is the entry point; it yields the changelog group, the
                 manifest group(s) and one group per changed file, each as a sequence
                 of chunk strings. Subclasses override deltaheader, deltaparent(),
                 builddeltaheader(), _packmanifests() and _manifestsdone() to produce
                 the newer formats.
                 """
                 deltaheader = _CHANGEGROUPV1_DELTA_HEADER
                 version = '01'
                 def __init__(self, repo, bundlecaps=None):
                     """Given a source repo, construct a bundler.
                     bundlecaps is optional and can be used to specify the set of
                     capabilities which can be used to build the bundle.
                     """
                     # Set of capabilities we can use to build the bundle.
                     if bundlecaps is None:
                         bundlecaps = set()
                     self._bundlecaps = bundlecaps
                     # experimental config: bundle.reorder
                     # 'auto' is stored as None; any other value is parsed as a boolean
                     reorder = repo.ui.config('bundle', 'reorder', 'auto')
                     if reorder == 'auto':
                         reorder = None
                     else:
                         reorder = util.parsebool(reorder)
                     self._repo = repo
                     self._reorder = reorder
                     self._progress = repo.ui.progress
                     # size notes are only emitted in verbose (but not debug) mode
                     if self._repo.ui.verbose and not self._repo.ui.debugflag:
                         self._verbosenote = self._repo.ui.note
                     else:
                         self._verbosenote = lambda s: None
                 def close(self):
                     """Return the chunk that terminates a group (closechunk())."""
                     return closechunk()
                 def fileheader(self, fname):
                     """Return fname framed as a chunk: chunk header followed by the name."""
                     return chunkheader(len(fname)) + fname
                 def group(self, nodelist, revlog, lookup, units=None):
                     """Calculate a delta group, yielding a sequence of changegroup chunks
                     (strings).
                     Given a list of changeset revs, return a set of deltas and
                     metadata corresponding to nodes. The first delta is
                     first parent(nodelist[0]) -> nodelist[0], the receiver is
                     guaranteed to have this parent as it has all history before
                     these changesets. In the case firstparent is nullrev the
                     changegroup starts with a full revision.
                     lookup maps a node of revlog to the link node stored in its delta
                     header.
                     If units is not None, progress detail will be generated, units specifies
                     the type of revlog that is touched (changelog, manifest, etc.).
                     """
                     # if we don't have any revisions touched by these changesets, bail
                     if len(nodelist) == 0:
                         yield self.close()
                         return
                     # for generaldelta revlogs, we linearize the revs; this will both be
                     # much quicker and generate a much smaller bundle
                     if (revlog._generaldelta and self._reorder is None) or self._reorder:
                         dag = dagutil.revlogdag(revlog)
                         revs = set(revlog.rev(n) for n in nodelist)
                         revs = dag.linearize(revs)
                     else:
                         revs = sorted([revlog.rev(n) for n in nodelist])
                     # add the parent of the first rev
                     p = revlog.parentrevs(revs[0])[0]
                     revs.insert(0, p)
                     # build deltas
                     # revs[0] is only the base of the first delta, hence "- 1"
                     total = len(revs) - 1
                     msgbundling = _('bundling')
                     for r in xrange(len(revs) - 1):
                         if units is not None:
                             self._progress(msgbundling, r + 1, unit=units, total=total)
                         prev, curr = revs[r], revs[r + 1]
                         linknode = lookup(revlog.node(curr))
                         for c in self.revchunk(revlog, curr, prev, linknode):
                             yield c
                     if units is not None:
                         self._progress(msgbundling, None)
                     yield self.close()
                 # filter any nodes that claim to be part of the known set
                 def prune(self, revlog, missing, commonrevs):
                     """Return the nodes of missing whose linkrev is not in commonrevs."""
                     rr, rl = revlog.rev, revlog.linkrev
                     return [n for n in missing if rl(rr(n)) not in commonrevs]
                 def _packmanifests(self, dir, mfnodes, lookuplinknode):
                     """Pack flat manifests into a changegroup stream."""
                     # this packer only handles the root manifest; dir must be empty
                     assert not dir
                     for chunk in self.group(mfnodes, self._repo.manifest,
                                             lookuplinknode, units=_('manifests')):
                         yield chunk
                 def _manifestsdone(self):
                     """Return what is emitted after all manifest groups (nothing here)."""
                     return ''
                 def generate(self, commonrevs, clnodes, fastpathlinkrev, source):
                     '''yield a sequence of changegroup chunks (strings)
                     The stream consists of the changelog group for clnodes, the
                     manifest group(s), the file groups and a final closing chunk.
                     commonrevs is used to prune manifest and file nodes.
                     fastpathlinkrev selects the linkrev-based file node lookup; it is
                     switched off below when reordering is enabled or when the repo
                     requires 'treemanifest'. When clnodes is non-empty, the 'outgoing'
                     hook is run after the last chunk with source passed along.
                     '''
                     repo = self._repo
                     cl = repo.changelog
                     clrevorder = {}
                     mfs = {} # needed manifests
                     fnodes = {} # needed file nodes
                     # maps manifest node id -> set(changed files)
                     mfchangedfiles = {}
                     # Callback for the changelog, used to collect changed files and manifest
                     # nodes.
                     # Returns the linkrev node (identity in the changelog case).
                     def lookupcl(x):
                         c = cl.read(x)
                         # remember the order in which changesets are emitted
                         clrevorder[x] = len(clrevorder)
                         n = c[0]
                         # record the first changeset introducing this manifest version
                         mfs.setdefault(n, x)
                         # Record a complete list of potentially-changed files in
                         # this manifest.
                         mfchangedfiles.setdefault(n, set()).update(c[3])
                         return x
                     self._verbosenote(_('uncompressed size of bundle content:\n'))
                     size = 0
                     for chunk in self.group(clnodes, cl, lookupcl, units=_('changesets')):
                         size += len(chunk)
                         yield chunk
                     self._verbosenote(_('%8.i (changelog)\n') % size)
                     # We need to make sure that the linkrev in the changegroup refers to
                     # the first changeset that introduced the manifest or file revision.
                     # The fastpath is usually safer than the slowpath, because the filelogs
                     # are walked in revlog order.
                     #
                     # When taking the slowpath with reorder=None and the manifest revlog
                     # uses generaldelta, the manifest may be walked in the "wrong" order.
                     # Without 'clrevorder', we would get an incorrect linkrev (see fix in
                     # cc0ff93d0c0c).
                     #
                     # When taking the fastpath, we are only vulnerable to reordering
                     # of the changelog itself. The changelog never uses generaldelta, so
                     # it is only reordered when reorder=True. To handle this case, we
                     # simply take the slowpath, which already has the 'clrevorder' logic.
                     # This was also fixed in cc0ff93d0c0c.
                     fastpathlinkrev = fastpathlinkrev and not self._reorder
                     # Treemanifests don't work correctly with fastpathlinkrev
                     # either, because we don't discover which directory nodes to
                     # send along with files. This could probably be fixed.
                     fastpathlinkrev = fastpathlinkrev and (
                         'treemanifest' not in repo.requirements)
                     for chunk in self.generatemanifests(commonrevs, clrevorder,
                             fastpathlinkrev, mfs, mfchangedfiles, fnodes):
                         yield chunk
                     # the manifest -> changeset map is not needed any more
                     mfs.clear()
                     clrevs = set(cl.rev(x) for x in clnodes)
                     if not fastpathlinkrev:
                         # slowpath: file nodes were collected into fnodes while the
                         # manifests were being generated
                         def linknodes(unused, fname):
                             return fnodes.get(fname, {})
                     else:
                         cln = cl.node
                         # fastpath: derive file node -> changeset node from the
                         # filelog linkrevs, keeping only outgoing changesets
                         def linknodes(filerevlog, fname):
                             llr = filerevlog.linkrev
                             fln = filerevlog.node
                             revs = ((r, llr(r)) for r in filerevlog)
                             return dict((fln(r), cln(lr)) for r, lr in revs if lr in clrevs)
                     changedfiles = set()
                     for x in mfchangedfiles.itervalues():
                         changedfiles.update(x)
                     for chunk in self.generatefiles(changedfiles, linknodes, commonrevs,
                                                     source):
                         yield chunk
                     yield self.close()
                     if clnodes:
                         repo.hook('outgoing', node=hex(clnodes[0]), source=source)
                 def generatemanifests(self, commonrevs, clrevorder, fastpathlinkrev, mfs,
                                       mfchangedfiles, fnodes):
                     """Yield the chunks of the manifest group(s).
                     mfs maps manifest node -> first changeset node introducing it,
                     mfchangedfiles maps manifest node -> set of changed file names and
                     clrevorder maps changeset node -> emission order. On the slowpath
                     (fastpathlinkrev false) fnodes is filled in as a side effect with
                     file name -> {file node: changeset node}. The root manifest group
                     is emitted first, followed by one group per collected
                     sub-directory manifest and finally by _manifestsdone().
                     """
                     repo = self._repo
                     ml = repo.manifest
                     # directory -> {submanifest node: changeset node}
                     tmfnodes = {}
                     # Callback for the manifest, used to collect linkrevs for filelog
                     # revisions.
                     # Returns the linkrev node (collected in lookupcl).
                     if fastpathlinkrev:
                         lookupmflinknode = mfs.__getitem__
                     else:
                         def lookupmflinknode(x):
                             """Callback for looking up the linknode for manifests.
                             Returns the linkrev node for the specified manifest.
                             SIDE EFFECT:
                             1) fnodes gets populated with the list of relevant
                                file nodes if we're not using fastpathlinkrev
                             2) When treemanifests are in use, collects treemanifest nodes
                                to send
                             Note that this means manifests must be completely sent to
                             the client before you can trust the list of files and
                             treemanifests to send.
                             """
                             clnode = mfs[x]
                             # We no longer actually care about reading deltas of
                             # the manifest here, because we already know the list
                             # of changed files, so for treemanifests (which
                             # lazily-load anyway to *generate* a readdelta) we can
                             # just load them with read() and then we'll actually
                             # be able to correctly load node IDs from the
                             # submanifest entries.
                             if 'treemanifest' in repo.requirements:
                                 mdata = ml.read(x)
                             else:
                                 mdata = ml.readfast(x)
                             for f in mfchangedfiles[x]:
                                 try:
                                     n = mdata[f]
                                 except KeyError:
                                     continue
                                 # record the first changeset introducing this filelog
                                 # version
                                 fclnodes = fnodes.setdefault(f, {})
                                 fclnode = fclnodes.setdefault(n, clnode)
                                 if clrevorder[clnode] < clrevorder[fclnode]:
                                     fclnodes[n] = clnode
                             # gather list of changed treemanifest nodes
                             if 'treemanifest' in repo.requirements:
                                 submfs = {'/': mdata}
                                 for dn, bn in _moddirs(mfchangedfiles[x]):
                                     try:
                                         submf = submfs[dn]
                                         submf = submf._dirs[bn]
                                     except KeyError:
                                         continue # deleted directory, so nothing to send
                                     submfs[submf.dir()] = submf
                                     tmfclnodes = tmfnodes.setdefault(submf.dir(), {})
                                     tmfclnode = tmfclnodes.setdefault(submf._node, clnode)
                                     if clrevorder[clnode] < clrevorder[tmfclnode]:
                                         # Key on the submanifest node itself; 'n' from
                                         # the file loop above is an unrelated file node.
                                         tmfclnodes[submf._node] = clnode
                             return clnode
                     mfnodes = self.prune(ml, mfs, commonrevs)
                     size = 0
                     for x in self._packmanifests('', mfnodes, lookupmflinknode):
                         size += len(x)
                         yield x
                     for dirname, nodes in tmfnodes.iteritems():
                         # drop directory manifest nodes linked to common changesets,
                         # exactly as is done for the root manifest above
                         prunednodes = self.prune(ml.dirlog(dirname), nodes, commonrevs)
                         for x in self._packmanifests(dirname, prunednodes, nodes.get):
                             size += len(x)
                             yield x
                     self._verbosenote(_('%8.i (manifests)\n') % size)
                     yield self._manifestsdone()
                 # The 'source' parameter is useful for extensions
                 def generatefiles(self, changedfiles, linknodes, commonrevs, source):
                     """Yield a file header plus delta group for every changed file.
                     linknodes(filerevlog, fname) must return a mapping of file node ->
                     changeset node. Files left without nodes after pruning against
                     commonrevs are skipped. Raises error.Abort when the revlog of a
                     changed file is empty or missing. source is not used here.
                     """
                     repo = self._repo
                     progress = self._progress
                     msgbundling = _('bundling')
                     total = len(changedfiles)
                     # for progress output
                     msgfiles = _('files')
                     for i, fname in enumerate(sorted(changedfiles)):
                         filerevlog = repo.file(fname)
                         if not filerevlog:
                             raise error.Abort(_("empty or missing revlog for %s") % fname)
                         linkrevnodes = linknodes(filerevlog, fname)
                         # Lookup for filenodes, we collected the linkrev nodes above in the
                         # fastpath case and with lookupmf in the slowpath case.
                         def lookupfilelog(x):
                             return linkrevnodes[x]
                         filenodes = self.prune(filerevlog, linkrevnodes, commonrevs)
                         if filenodes:
                             progress(msgbundling, i + 1, item=fname, unit=msgfiles,
                                      total=total)
                             h = self.fileheader(fname)
                             size = len(h)
                             yield h
                             for chunk in self.group(filenodes, filerevlog, lookupfilelog):
                                 size += len(chunk)
                                 yield chunk
                             self._verbosenote(_('%8.i  %s\n') % (size, fname))
                     progress(msgbundling, None)
                 def deltaparent(self, revlog, rev, p1, p2, prev):
                     """Return the delta base for rev: always the previously sent rev."""
                     return prev
                 def revchunk(self, revlog, rev, prev, linknode):
                     """Yield the chunk header, delta header and delta for one revision.
                     The delta is computed against deltaparent(); a full revision
                     preceded by a diff header is sent when the base is nullrev or when
                     either the base or the revision itself is censored.
                     """
                     node = revlog.node(rev)
                     p1, p2 = revlog.parentrevs(rev)
                     base = self.deltaparent(revlog, rev, p1, p2, prev)
                     prefix = ''
                     if revlog.iscensored(base) or revlog.iscensored(rev):
                         # no delta against or for censored content: send the full
                         # text, or the tombstone when reading the revision fails
                         try:
                             delta = revlog.revision(node)
                         except error.CensoredNodeError as e:
                             delta = e.tombstone
                         if base == nullrev:
                             prefix = mdiff.trivialdiffheader(len(delta))
                         else:
                             baselen = revlog.rawsize(base)
                             prefix = mdiff.replacediffheader(baselen, len(delta))
                     elif base == nullrev:
                         delta = revlog.revision(node)
                         prefix = mdiff.trivialdiffheader(len(delta))
                     else:
                         delta = revlog.revdiff(base, rev)
                     p1n, p2n = revlog.parents(node)
                     basenode = revlog.node(base)
                     flags = revlog.flags(rev)
                     meta = self.builddeltaheader(node, p1n, p2n, basenode, linknode, flags)
                     meta += prefix
                     # the chunk length covers the delta header, the prefix and the delta
                     l = len(meta) + len(delta)
                     yield chunkheader(l)
                     yield meta
                     yield delta
                 def builddeltaheader(self, node, p1n, p2n, basenode, linknode, flags):
                     """Return the packed cg1 delta header (node, p1, p2, linknode)."""
                     # do nothing with basenode, it is implicitly the previous one in HG10
                     # do nothing with flags, it is implicitly 0 for cg1 and cg2
                     return struct.pack(self.deltaheader, node, p1n, p2n, linknode)
             class cg2packer(cg1packer):
                 """Packer producing version '02' changegroup streams.
                 The delta header additionally carries the delta base node, so the
                 delta parent stored in the revlog can be reused where that is safe.
                 """
                 deltaheader = _CHANGEGROUPV2_DELTA_HEADER
                 version = '02'
                 def __init__(self, repo, bundlecaps=None):
                     """Construct the bundler; bundle.reorder=auto is treated as False."""
                     super(cg2packer, self).__init__(repo, bundlecaps)
                     # cg2 supports generaldelta directly, so reordering generally
                     # does not help; "auto" (None) therefore means "off" here.
                     if self._reorder is None:
                         self._reorder = False
                 def deltaparent(self, revlog, rev, p1, p2, prev):
                     """Return the revlog's own delta parent when the receiver is known
                     to have it, otherwise prev."""
                     stored = revlog.deltaparent(rev)
                     # The stored base is usable only if it is a real revision (not a
                     # full snapshot) and one the remote is sure to have: a parent
                     # or the revision sent just before this one.
                     if stored != nullrev and (
                             stored == p1 or stored == p2 or stored == prev):
                         return stored
                     return prev
                 def builddeltaheader(self, node, p1n, p2n, basenode, linknode, flags):
                     """Return the packed cg2 delta header; flags are not transmitted."""
                     # flags are implicitly 0 in cg1 and cg2
                     fields = (node, p1n, p2n, basenode, linknode)
                     return struct.pack(self.deltaheader, *fields)
             class cg3packer(cg2packer):
                 """Packer for changegroup version '03'.

                 Uses the V3 delta header, which additionally carries the revlog
                 flags, and packs manifests per directory.
                 """
                 version = '03'
                 deltaheader = _CHANGEGROUPV3_DELTA_HEADER

                 def _packmanifests(self, dir, mfnodes, lookuplinknode):
                     """Yield the chunks for the manifest revlog of directory dir.

                     When dir is non-empty a file header naming it is yielded first.
                     """
                     if dir:
                         yield self.fileheader(dir)
                     dirlog = self._repo.manifest.dirlog(dir)
                     chunks = self.group(mfnodes, dirlog, lookuplinknode,
                                         units=_('manifests'))
                     for chunk in chunks:
                         yield chunk

                 def _manifestsdone(self):
                     """Return the closing chunk that ends the manifest section."""
                     return self.close()

                 def builddeltaheader(self, node, p1n, p2n, basenode, linknode, flags):
                     """Pack the cg3 delta header, including basenode and flags."""
                     fields = (node, p1n, p2n, basenode, linknode, flags)
                     return struct.pack(self.deltaheader, *fields)
             # Maps each changegroup version string to its (packer, unpacker) classes.
             _packermap = {
                 '01': (cg1packer, cg1unpacker),
                 # cg2 adds support for exchanging generaldelta
                 '02': (cg2packer, cg2unpacker),
                 # cg3 adds support for exchanging revlog flags and treemanifests
                 '03': (cg3packer, cg3unpacker),
             }
             def allsupportedversions(ui):
                 """Return the set of changegroup versions enabled by configuration.

                 Every version registered in _packermap is included, except that '03'
                 is present only when experimental.changegroup3 or
                 experimental.treemanifest is set.
                 """
                 versions = set(_packermap)
                 cg3enabled = (ui.configbool('experimental', 'changegroup3') or
                               ui.configbool('experimental', 'treemanifest'))
                 if cg3enabled:
                     versions.add('03')
                 else:
                     versions.discard('03')
                 return versions
             # Changegroup versions that can be applied to the repo
             def supportedincomingversions(repo):
                 """Return the set of changegroup versions that can be applied to repo.

                 Starts from the versions enabled by repo.ui and always includes '03'
                 when the repository has the 'treemanifest' requirement.
                 """
                 incoming = allsupportedversions(repo.ui)
                 usestrees = 'treemanifest' in repo.requirements
                 if usestrees:
                     incoming.add('03')
                 return incoming
             # Changegroup versions that can be created from the repo
             def supportedoutgoingversions(repo):
                 """Return the set of changegroup versions that can be created from repo.

                 For a repository with the 'treemanifest' requirement only '03' (plus
                 any other non-flat version) remains; '01' and '02' are removed.
                 """
                 outgoing = allsupportedversions(repo.ui)
                 if 'treemanifest' not in repo.requirements:
                     return outgoing
                 # Versions 01 and 02 support only flat manifests and it's just too
                 # expensive to convert between the flat manifest and tree manifest on
                 # the fly. Since tree manifests are hashed differently, all of history
                 # would have to be converted. Instead, we simply don't even pretend to
                 # support versions 01 and 02.
                 for flatonly in ('01', '02'):
                     outgoing.discard(flatonly)
                 outgoing.add('03')
                 return outgoing
             def safeversion(repo):
                 """Return the smallest version that clients of repo can be assumed
                 to support.
                 """
                 candidates = supportedoutgoingversions(repo)
                 # For example, all hg versions that support generaldelta also
                 # support changegroup 02, so 01 need not be considered then.
                 if 'generaldelta' in repo.requirements:
                     candidates.discard('01')
                 assert candidates
                 return min(candidates)
             def getbundler(version, repo, bundlecaps=None):
                 """Instantiate the packer registered for version.

                 version must be one of supportedoutgoingversions(repo); this is
                 checked with an assertion.
                 """
                 assert version in supportedoutgoingversions(repo)
                 packercls = _packermap[version][0]
                 return packercls(repo, bundlecaps)
             def getunbundler(version, fh, alg):
                 """Instantiate the unpacker registered for version with fh and alg."""
                 unpackercls = _packermap[version][1]
                 return unpackercls(fh, alg)
             def _changegroupinfo(repo, nodes, source):
                 """Report the changesets being bundled through repo.ui.

                 The count is shown in verbose mode or when source is 'bundle'; the
                 hex id of every node is listed when the debug flag is set.
                 """
                 ui = repo.ui
                 showcount = ui.verbose or source == 'bundle'
                 if showcount:
                     ui.status(_("%d changesets found\n") % len(nodes))
                 if not ui.debugflag:
                     return
                 ui.debug("list of changesets:\n")
                 for changeset in nodes:
                     ui.debug("%s\n" % hex(changeset))
             def getsubsetraw(repo, outgoing, bundler, source, fastpath=False):
                 """Generate the raw changegroup for the changesets in outgoing.

                 repo is switched to its unfiltered view, the 'preoutgoing' hook is
                 run with throw=True, the changeset summary is reported, and the
                 result of bundler.generate() is returned.

                 outgoing.missingheads is only read: it is compared in sorted order
                 without being reordered in place.
                 """
                 repo = repo.unfiltered()
                 commonrevs = outgoing.common
                 csets = outgoing.missing
                 # Sort a copy rather than calling .sort() on the caller-owned list,
                 # so that outgoing.missingheads keeps its original order.
                 heads = sorted(outgoing.missingheads)
                 # We go through the fast path if we get told to, or if all
                 # (unfiltered) heads have been requested (since we then know that
                 # all linkrevs will be pulled by the client).
                 fastpathlinkrev = fastpath or (
                         repo.filtername is None and heads == sorted(repo.heads()))
                 repo.hook('preoutgoing', throw=True, source=source)
                 _changegroupinfo(repo, csets, source)
                 return bundler.generate(commonrevs, csets, fastpathlinkrev, source)
             def getsubset(repo, outgoing, bundler, source, fastpath=False):
                 """Like getsubsetraw, but wrap the raw chunks in an unbundler.

                 The generator is buffered with util.chunkbuffer and handed to the
                 unpacker matching bundler.version.
                 """
                 rawchunks = getsubsetraw(repo, outgoing, bundler, source, fastpath)
                 version = bundler.version
                 stream = util.chunkbuffer(rawchunks)
                 return getunbundler(version, stream, None)
             def changegroupsubset(repo, roots, heads, source, version='01'):
                 """Compute a changegroup consisting of all the nodes that are
                 descendants of any of the roots and ancestors of any of the heads.

                 Return a chunkbuffer object whose read() method will return
                 successive changegroup chunks.

                 It is fairly complex as determining which filenodes and which
                 manifest nodes need to be included for the changeset to be complete
                 is non-trivial.

                 Another wrinkle is doing the reverse, figuring out which changeset in
                 the changegroup a particular filenode or manifestnode belongs to.
                 """
                 cl = repo.changelog
                 if not roots:
                     roots = [nullid]
                 # Non-null parents of the roots are the candidate discovery bases.
                 rootparents = [parent
                                for root in roots
                                for parent in cl.parents(root)
                                if parent != nullid]
                 # TODO: remove call to nodesbetween.
                 csets, roots, heads = cl.nodesbetween(roots, heads)
                 included = set(csets)
                 # A base that is itself part of the changegroup is not a base.
                 discbases = [base for base in rootparents if base not in included]
                 outgoing = discovery.outgoing(cl, discbases, heads)
                 bundler = getbundler(version, repo)
                 return getsubset(repo, outgoing, bundler, source)
             def getlocalchangegroupraw(repo, source, outgoing, bundlecaps=None,
                                        version='01'):
                 """Like getbundle, but taking a discovery.outgoing as an argument.

                 This is only implemented for local repos and reuses potentially
                 precomputed sets in outgoing. Returns a raw changegroup generator,
                 or None when outgoing.missing is empty."""
                 if outgoing.missing:
                     bundler = getbundler(version, repo, bundlecaps)
                     return getsubsetraw(repo, outgoing, bundler, source)
                 return None
             def getlocalchangegroup(repo, source, outgoing, bundlecaps=None,
                                     version='01'):
                 """Like getbundle, but taking a discovery.outgoing as an argument.

                 This is only implemented for local repos and reuses potentially
                 precomputed sets in outgoing. Returns None when outgoing.missing is
                 empty."""
                 if outgoing.missing:
                     bundler = getbundler(version, repo, bundlecaps)
                     return getsubset(repo, outgoing, bundler, source)
                 return None
             def computeoutgoing(repo, heads, common):
                 """Computes which revs are outgoing given a set of common
                 and a set of heads.

                 This is a separate function so extensions can have access to
                 the logic.

                 Nodes in common that the changelog does not know are dropped; an
                 empty common becomes [nullid] and empty heads become the changelog
                 heads.

                 Returns a discovery.outgoing object.
                 """
                 cl = repo.changelog
                 if not common:
                     knowncommon = [nullid]
                 else:
                     hasnode = cl.hasnode
                     knowncommon = [n for n in common if hasnode(n)]
                 if not heads:
                     heads = cl.heads()
                 return discovery.outgoing(cl, knowncommon, heads)
             def getchangegroup(repo, source, heads=None, common=None, bundlecaps=None,
                                version='01'):
                 """Like changegroupsubset, but returns the set difference between the
                 ancestors of heads and the ancestors common.

                 If heads is None, use the local heads. If common is None, use [nullid].

                 The nodes in common might not all be known locally due to the way the
                 current discovery protocol works.
                 """
                 missing = computeoutgoing(repo, heads, common)
                 return getlocalchangegroup(repo, source, missing,
                                            bundlecaps=bundlecaps, version=version)
             def changegroup(repo, basenodes, source):
                 """Return a changegroup from basenodes up to the current repo heads."""
                 # to avoid a race we use changegroupsubset() (issue1320)
                 currentheads = repo.heads()
                 return changegroupsubset(repo, basenodes, currentheads, source)
             def _addchangegroupfiles(repo, source, revmap, trp, pr, needfiles):
                 """Apply every file group read from source to the matching filelog.

                 Groups are consumed until source.filelogheader() returns a false
                 value. pr is called with no arguments once per file group.

                 needfiles maps a filename to the collection of nodes expected for
                 it; entries are removed as the nodes arrive, and the mapping is
                 modified in place. Aborts when a group is empty, when a delta base
                 is censored, when an unexpected node arrives for a tracked file, or
                 when a still-expected node is missing from its filelog at the end.

                 Returns a (revisions, files) tuple counting what was added.
                 """
                 revisions = 0
                 files = 0
                 while True:
                     chunkdata = source.filelogheader()
                     if not chunkdata:
                         break
                     fname = chunkdata["filename"]
                     repo.ui.debug("adding %s revisions\n" % fname)
                     pr()
                     flog = repo.file(fname)
                     oldlen = len(flog)
                     try:
                         added = flog.addgroup(source, revmap, trp)
                     except error.CensoredBaseError as e:
                         raise error.Abort(_("received delta base is censored: %s") % e)
                     if not added:
                         raise error.Abort(_("received file revlog group is empty"))
                     newlen = len(flog)
                     revisions += newlen - oldlen
                     files += 1
                     if fname not in needfiles:
                         continue
                     expected = needfiles[fname]
                     # Every revision just added must be one we were waiting for.
                     for newrev in xrange(oldlen, newlen):
                         newnode = flog.node(newrev)
                         if newnode not in expected:
                             raise error.Abort(
                                 _("received spurious file revlog entry"))
                         expected.remove(newnode)
                     if not expected:
                         del needfiles[fname]
                 repo.ui.progress(_('files'), None)
                 # Whatever is still expected must already exist in the filelog.
                 for fname, expected in needfiles.iteritems():
                     flog = repo.file(fname)
                     for wanted in expected:
                         try:
                             flog.rev(wanted)
                         except error.LookupError:
                             raise error.Abort(
                                 _('missing file data for %s:%s - run hg verify') %
                                 (fname, hex(wanted)))
                 return revisions, files