upstream/mercurial-mirror Commit - r28232:829d369f

1

# changegroup.py - Mercurial changegroup manipulation functions

1

# changegroup.py - Mercurial changegroup manipulation functions

2

#

2

#

3

4

#

4

#

5

# This software may be used and distributed according to the terms of the

5

# This software may be used and distributed according to the terms of the

6

# GNU General Public License version 2 or any later version.

6

# GNU General Public License version 2 or any later version.

7

8

from __future__ import absolute_import

8

from __future__ import absolute_import

9

10

import os

10

import os

11

import struct

11

import struct

12

import tempfile

12

import tempfile

13

import weakref

13

import weakref

14

15

from .i18n import _

15

from .i18n import _

16

from .node import (

16

from .node import (

17

hex,

17

hex,

18

nullid,

18

nullid,

19

nullrev,

19

nullrev,

20

short,

20

short,

21

)

21

)

22

23

from . import (

23

from . import (

24

branchmap,

24

branchmap,

25

dagutil,

25

dagutil,

26

discovery,

26

discovery,

27

error,

27

error,

28

mdiff,

28

mdiff,

29

phases,

29

phases,

30

util,

30

util,

31

)

31

)

32

33

# struct formats of the fixed-size header that precedes every delta.
# Each "20s" field is one 20-byte string; the unpackers below name them.
# v1: node, p1, p2, cs
_CHANGEGROUPV1_DELTA_HEADER = "20s20s20s20s"
# v2: node, p1, p2, deltabase, cs
_CHANGEGROUPV2_DELTA_HEADER = "20s20s20s20s20s"
# v3: the five 20-byte fields followed by a big-endian unsigned short
_CHANGEGROUPV3_DELTA_HEADER = ">20s20s20s20s20sH"

36

37

def readexactly(stream, n):
    '''Read n bytes from stream.read; abort if fewer were available.

    Returns the data read. Raises error.Abort, reporting both the number
    of bytes obtained and the number requested, when the read comes up
    short.
    '''
    data = stream.read(n)
    got = len(data)
    if got >= n:
        return data
    raise error.Abort(_("stream ended unexpectedly"
                        " (got %d bytes, expected %d)")
                      % (got, n))

45

46

def getchunk(stream):
    """Return the payload of the next chunk read from stream.

    A chunk starts with a 4-byte big-endian signed length that includes
    those four bytes. A length of 0 yields the empty string; any other
    length of 4 or less raises error.Abort.
    """
    (length,) = struct.unpack(">l", readexactly(stream, 4))
    if length > 4:
        return readexactly(stream, length - 4)
    if length:
        raise error.Abort(_("invalid chunk length %d") % length)
    return ""

55

56

def chunkheader(length):
    """Return the changegroup chunk header (string) for a payload size.

    The packed value is length + 4: the length field counts its own
    four bytes, which is why getchunk() subtracts 4 when reading.
    """
    framed = length + 4
    return struct.pack(">l", framed)

59

60

def closechunk():
    """Return the chunk header (string) of a zero-length chunk.

    This is a packed big-endian length of 0, which getchunk() reports as
    an empty chunk.
    """
    terminator = struct.pack(">l", 0)
    return terminator

63

64

def combineresults(results):
    """Combine 0 or more addchangegroup results into one.

    Each result uses the encoding documented on cg1unpacker.apply():
    0 means nothing changed, 1 means the head count is unchanged,
    2..n means 1 + added heads and -2..-n means -1 - removed heads.

    Returns 0 as soon as any individual result is 0. Otherwise the head
    deltas are summed and re-encoded the same way; an empty ``results``
    gives 1.
    """
    changedheads = 0
    for ret in results:
        # If any changegroup result is 0, return 0. Returning right away
        # keeps head changes accumulated from earlier results from
        # overriding the 0.
        if ret == 0:
            return 0
        if ret < -1:
            changedheads += ret + 1
        elif ret > 1:
            changedheads += ret - 1
    if changedheads > 0:
        return 1 + changedheads
    if changedheads < 0:
        return -1 + changedheads
    return 1

82

83

# Maps a bundle type name to a (header, compression) pair; writebundle()
# writes the header first and uses the compression name as a key into
# util.compressors.
bundletypes = {
    # The empty type is only used for unbundle on ssh and old http
    # servers: since the unification ssh accepts a header but there is
    # no capability signaling it.
    "": ("", None),
    "HG20": (), # special-cased below
    "HG10UN": ("HG10UN", None),
    "HG10BZ": ("HG10", 'BZ'),
    "HG10GZ": ("HG10GZ", 'GZ'),
}

# hgweb uses this list to communicate its preferred type
bundlepriority = ['HG10GZ', 'HG10BZ', 'HG10UN']

95

96

def writechunks(ui, chunks, filename, vfs=None):
    """Write chunks to a file and return its filename.

    The stream is assumed to be a bundle file.
    A named file is opened in "wb" mode, through vfs when one is given.
    If no filename is specified, a temporary file is created with
    tempfile.mkstemp() and its path is returned.
    If writing fails part-way, the file is closed and removed again.
    """
    out = None
    doomed = None  # path to delete in the finally block, if any
    try:
        if not filename:
            fd, filename = tempfile.mkstemp(prefix="hg-bundle-", suffix=".hg")
            out = os.fdopen(fd, "wb")
        elif vfs:
            out = vfs.open(filename, "wb")
        else:
            out = open(filename, "wb")
        # From here until every chunk is written, an exception must
        # remove the partial file.
        doomed = filename
        for piece in chunks:
            out.write(piece)
        doomed = None
        return filename
    finally:
        if out is not None:
            out.close()
        if doomed is not None:
            if filename and vfs:
                vfs.unlink(doomed)
            else:
                os.unlink(doomed)

127

128

def writebundle(ui, cg, filename, bundletype, vfs=None, compression=None):
    """Write a bundle file and return its filename.

    For bundletype "HG20" the changegroup is wrapped in a bundle2
    'changegroup' part carrying cg.version, and ``compression`` is handed
    to the bundle. For every other type the header and compressor come
    from ``bundletypes``; ``compression`` must then be None and only
    version '01' changegroups are accepted (error.Abort otherwise, and
    also when the compression name is not in util.compressors).

    The file itself is written by writechunks(): if no filename is
    specified a temporary file is created, and the bundle file is deleted
    in case of errors.
    """

    if bundletype == "HG20":
        from . import bundle2
        bundler = bundle2.bundle20(ui)
        bundler.setcompression(compression)
        cgpart = bundler.newpart('changegroup', data=cg.getchunks())
        cgpart.addparam('version', cg.version)
        chunkiter = bundler.getchunks()
    else:
        # compression argument is only for the bundle2 case
        assert compression is None
        if cg.version != '01':
            raise error.Abort(_('old bundle types only supports v1 '
                                'changegroups'))
        header, comp = bundletypes[bundletype]
        if comp not in util.compressors:
            raise error.Abort(_('unknown stream compression type: %s')
                              % comp)
        engine = util.compressors[comp]()
        rawchunks = cg.getchunks()

        def _compressed():
            # the header goes out as-is; everything after it is compressed
            yield header
            for raw in rawchunks:
                yield engine.compress(raw)
            yield engine.flush()

        chunkiter = _compressed()

    # parse the changegroup data, otherwise we will block
    # in case of sshrepo because we don't know the end of the stream

    # an empty chunkgroup is the end of the changegroup
    # a changegroup has at least 2 chunkgroups (changelog and manifest).
    # after that, an empty chunkgroup is the end of the changegroup
    return writechunks(ui, chunkiter, filename, vfs=vfs)

170

171

class cg1unpacker(object):
    """Unpacker for cg1 changegroup streams.

    A changegroup unpacker handles the framing of the revision data in
    the wire format. Most consumers will want to use the apply()
    method to add the changes from the changegroup to a repository.

    If you're forwarding a changegroup unmodified to another consumer,
    use getchunks(), which returns an iterator of changegroup
    chunks. This is mostly useful for cases where you need to know the
    data stream has ended by observing the end of the changegroup.

    deltachunk() is useful only if you're applying delta data. Most
    consumers should prefer apply() instead.

    A few other public methods exist. Those are used only for
    bundlerepo and some debug commands - their use is discouraged.
    """
    # struct format and byte size of the header in front of each delta
    deltaheader = _CHANGEGROUPV1_DELTA_HEADER
    deltaheadersize = struct.calcsize(deltaheader)
    version = '01'
    _grouplistcount = 1 # One list of files after the manifests

    def __init__(self, fh, alg):
        """Wrap fh in the decompressor selected by alg.

        'UN' is treated as None. The name is checked against
        util.decompressors (error.Abort if unknown) before 'BZ' is
        swapped for the '_truncatedBZ' decompressor.
        """
        if alg == 'UN':
            alg = None # get more modern without breaking too much
        if alg not in util.decompressors:
            raise error.Abort(_('unknown stream compression type: %s')
                              % alg)
        if alg == 'BZ':
            alg = '_truncatedBZ'
        self._stream = util.decompressors[alg](fh)
        self._type = alg
        # optional callable invoked by _chunklength() for each non-empty
        # chunk; apply() uses it to report progress
        self.callback = None

    # These methods (compressed, read, seek, tell) all appear to only
    # be used by bundlerepo, but it's a little hard to tell.
    def compressed(self):
        return self._type is not None

    def read(self, l):
        return self._stream.read(l)

    def seek(self, pos):
        return self._stream.seek(pos)

    def tell(self):
        return self._stream.tell()

    def close(self):
        return self._stream.close()

    def _chunklength(self):
        """Read a chunk length field and return the payload size.

        Returns 0 for an empty chunk, raises error.Abort for any other
        length of 4 or less, and calls self.callback (when set) before
        returning the size of a non-empty chunk.
        """
        (length,) = struct.unpack(">l", readexactly(self._stream, 4))
        if length <= 4:
            if length:
                raise error.Abort(_("invalid chunk length %d") % length)
            return 0
        if self.callback:
            self.callback()
        return length - 4

    def changelogheader(self):
        """v10 does not have a changelog header chunk"""
        return {}

    def manifestheader(self):
        """v10 does not have a manifest header chunk"""
        return {}

    def filelogheader(self):
        """return the header of the filelogs chunk, v10 only has the filename"""
        size = self._chunklength()
        if not size:
            return {}
        return {'filename': readexactly(self._stream, size)}

    def _deltaheader(self, headertuple, prevnode):
        """Expand an unpacked v1 header to the 6-tuple deltachunk() uses.

        v1 headers carry no delta base: the base is the previous node of
        the group, or p1 when there is no previous node. Flags are
        always 0.
        """
        node, p1, p2, cs = headertuple
        deltabase = p1 if prevnode is None else prevnode
        return node, p1, p2, deltabase, cs, 0

    def deltachunk(self, prevnode):
        """Read the next delta chunk and return it as a dict.

        An empty chunk gives {}. Otherwise the dict has the keys 'node',
        'p1', 'p2', 'cs', 'deltabase', 'delta' and 'flags'.
        """
        size = self._chunklength()
        if not size:
            return {}
        rawheader = readexactly(self._stream, self.deltaheadersize)
        fields = struct.unpack(self.deltaheader, rawheader)
        delta = readexactly(self._stream, size - self.deltaheadersize)
        node, p1, p2, deltabase, cs, flags = self._deltaheader(fields,
                                                               prevnode)
        return {'node': node, 'p1': p1, 'p2': p2, 'cs': cs,
                'deltabase': deltabase, 'delta': delta, 'flags': flags}

    def getchunks(self):
        """returns all the chunks contains in the bundle

        Used when you need to forward the binary stream to a file or another
        network API. To do so, it parse the changegroup data, otherwise it will
        block in case of sshrepo because it don't know the end of the stream.
        """
        # an empty chunkgroup is the end of the changegroup
        # a changegroup has at least 2 chunkgroups (changelog and manifest).
        # after that, changegroup versions 1 and 2 have a series of groups
        # with one group per file. changegroup 3 has a series of directory
        # manifests before the files.
        groupsseen = 0
        emptygroups = 0
        while emptygroups < self._grouplistcount:
            groupisempty = True
            groupsseen += 1
            while True:
                chunk = getchunk(self)
                if not chunk:
                    # only empty groups after the first two count as
                    # list terminators
                    if groupisempty and groupsseen > 2:
                        emptygroups += 1
                    break
                groupisempty = False
                yield chunkheader(len(chunk))
                # hand the payload out in slices of at most 2**20 bytes
                start = 0
                while start < len(chunk):
                    stop = start + 2**20
                    yield chunk[start:stop]
                    start = stop
            yield closechunk()

    def _unpackmanifests(self, repo, revmap, trp, prog, numchanges):
        """Add the manifest group to repo.manifest, reporting progress."""
        # We know that we'll never have more manifests than we had
        # changesets.
        self.callback = prog(_('manifests'), numchanges)
        # no need to check for empty manifest group here:
        # if the result of the merge of 1 and 2 is the same in 3 and 4,
        # no new manifest will be created and the manifest group will
        # be empty during the pull
        self.manifestheader()
        repo.manifest.addgroup(self, revmap, trp)
        repo.ui.progress(_('manifests'), None)

    def apply(self, repo, srctype, url, emptyok=False,
              targetphase=phases.draft, expectedtotal=None):
        """Add the changegroup returned by source.read() to this repo.
        srctype is a string like 'push', 'pull', or 'unbundle'.  url is
        the URL of the repo where this changegroup is coming from.

        Return an integer summarizing the change to this repo:
        - nothing changed or no source: 0
        - more heads than before: 1+added heads (2..n)
        - fewer heads than before: -1-removed heads (-2..-n)
        - number of heads stays the same: 1
        """
        repo = repo.unfiltered()

        # Both helpers read ``cl``, which is bound inside the transaction
        # below before either of them is called.
        def csmap(x):
            repo.ui.debug("add changeset %s\n" % short(x))
            return len(cl)

        def revmap(x):
            return cl.rev(x)

        changesets = files = revisions = 0

        try:
            with repo.transaction("\n".join([srctype,
                                             util.hidepassword(url)])) as tr:
                # The transaction could have been created before and already
                # carries source information. In this case we use the top
                # level data. We overwrite the argument because we need to use
                # the top level value (if they exist) in this function.
                srctype = tr.hookargs.setdefault('source', srctype)
                url = tr.hookargs.setdefault('url', url)
                repo.hook('prechangegroup', throw=True, **tr.hookargs)

                # write changelog data to temp files so concurrent readers
                # will not see an inconsistent view
                cl = repo.changelog
                cl.delayupdate(tr)
                oldheads = cl.heads()

                trp = weakref.proxy(tr)
                # pull off the changeset group
                repo.ui.status(_("adding changesets\n"))
                clstart = len(cl)

                class prog(object):
                    """Progress reporter: each call reports one more chunk."""
                    def __init__(self, step, total):
                        self._step = step
                        self._total = total
                        self._count = 1

                    def __call__(self):
                        repo.ui.progress(self._step, self._count,
                                         unit=_('chunks'), total=self._total)
                        self._count += 1

                self.callback = prog(_('changesets'), expectedtotal)

                # collects field 3 of every added changelog entry; its
                # size becomes the total for the 'files' progress below
                efiles = set()

                def onchangelog(cl, node):
                    efiles.update(cl.read(node)[3])

                self.changelogheader()
                srccontent = cl.addgroup(self, csmap, trp,
                                         addrevisioncb=onchangelog)
                efiles = len(efiles)

                if not (srccontent or emptyok):
                    raise error.Abort(_("received changelog group is empty"))
                clend = len(cl)
                changesets = clend - clstart
                repo.ui.progress(_('changesets'), None)

                # pull off the manifest group
                repo.ui.status(_("adding manifests\n"))
                self._unpackmanifests(repo, revmap, trp, prog, changesets)

                needfiles = {}
                if repo.ui.configbool('server', 'validate', default=False):
                    # validate incoming csets have their manifests
                    for cset in xrange(clstart, clend):
                        mfnode = repo.changelog.read(
                            repo.changelog.node(cset))[0]
                        mfest = repo.manifest.readdelta(mfnode)
                        # store file nodes we must see
                        for f, n in mfest.iteritems():
                            needfiles.setdefault(f, set()).add(n)

                # process the files
                repo.ui.status(_("adding file changes\n"))
                self.callback = None
                pr = prog(_('files'), efiles)
                newrevs, newfiles = _addchangegroupfiles(
                    repo, self, revmap, trp, pr, needfiles)
                revisions += newrevs
                files += newfiles

                # dh is the change in head count; new heads that close
                # their branch are not counted
                dh = 0
                if oldheads:
                    heads = cl.heads()
                    dh = len(heads) - len(oldheads)
                    for h in heads:
                        if h not in oldheads and repo[h].closesbranch():
                            dh -= 1
                htext = ""
                if dh:
                    htext = _(" (%+d heads)") % dh

                repo.ui.status(_("added %d changesets"
                                 " with %d changes to %d files%s\n")
                               % (changesets, revisions, files, htext))
                repo.invalidatevolatilesets()

                if changesets > 0:
                    if 'node' not in tr.hookargs:
                        tr.hookargs['node'] = hex(cl.node(clstart))
                        tr.hookargs['node_last'] = hex(cl.node(clend - 1))
                        hookargs = dict(tr.hookargs)
                    else:
                        # the transaction already names a node: leave it
                        # alone and describe this group on a copy only
                        hookargs = dict(tr.hookargs)
                        hookargs['node'] = hex(cl.node(clstart))
                        hookargs['node_last'] = hex(cl.node(clend - 1))
                    repo.hook('pretxnchangegroup', throw=True, **hookargs)

                added = [cl.node(r) for r in xrange(clstart, clend)]
                publishing = repo.publishing()
                if srctype in ('push', 'serve'):
                    # Old servers can not push the boundary themselves.
                    # New servers won't push the boundary if changeset already
                    # exists locally as secret
                    #
                    # We should not use added here but the list of all change in
                    # the bundle
                    if publishing:
                        phases.advanceboundary(repo, tr, phases.public,
                                               srccontent)
                    else:
                        # Those changesets have been pushed from the
                        # outside, their phases are going to be pushed
                        # alongside. Therefor `targetphase` is
                        # ignored.
                        phases.advanceboundary(repo, tr, phases.draft,
                                               srccontent)
                        phases.retractboundary(repo, tr, phases.draft, added)
                elif srctype != 'strip':
                    # publishing only alter behavior during push
                    #
                    # strip should not touch boundary at all
                    phases.retractboundary(repo, tr, targetphase, added)

                if changesets > 0:
                    if srctype != 'strip':
                        # During strip, branchcache is invalid but
                        # coming call to `destroyed` will repair it.
                        # In other case we can safely update cache on
                        # disk.
                        branchmap.updatecache(repo.filtered('served'))

                    def runhooks():
                        # These hooks run when the lock releases, not when the
                        # transaction closes. So it's possible for the changelog
                        # to have changed since we last saw it.
                        if clstart >= len(repo):
                            return

                        # forcefully update the on-disk branch cache
                        repo.ui.debug("updating the branch cache\n")
                        repo.hook("changegroup", **hookargs)

                        for n in added:
                            args = hookargs.copy()
                            args['node'] = hex(n)
                            del args['node_last']
                            repo.hook("incoming", **args)

                        newheads = [h for h in repo.heads()
                                    if h not in oldheads]
                        repo.ui.log("incoming",
                                    "%s incoming changes - new heads: %s\n",
                                    len(added),
                                    ', '.join([hex(c[:6]) for c in newheads]))

                    tr.addpostclose('changegroup-runhooks-%020i' % clstart,
                                    lambda tr: repo._afterlock(runhooks))
        finally:
            repo.ui.flush()
        # never return 0 here:
        return dh - 1 if dh < 0 else dh + 1

497

498

class cg2unpacker(cg1unpacker):
    """Reader for version '02' changegroup streams.

    The only difference from cg1 handled here is the delta header: cg2
    was introduced to support generaldelta, so each header carries an
    explicit delta base node. Everything else is inherited unchanged.
    """
    version = '02'
    deltaheader = _CHANGEGROUPV2_DELTA_HEADER
    deltaheadersize = struct.calcsize(deltaheader)

    def _deltaheader(self, headertuple, prevnode):
        """Normalize an unpacked cg2 header to the six-field form.

        headertuple holds (node, p1, p2, deltabase, linknode). prevnode
        is unused because the base is given explicitly in the header.
        """
        node, parent1, parent2, base, linknode = headertuple
        # the cg2 header has no flags field, so flags are always 0
        return node, parent1, parent2, base, linknode, 0

513

514

class cg3unpacker(cg2unpacker):
    """Reader for version '03' changegroup streams.

    On top of cg2, cg3 can exchange treemanifests and revlog flags: the
    delta header gains a flags field, and an empty chunk separates the
    manifests from the files.
    """
    version = '03'
    deltaheader = _CHANGEGROUPV3_DELTA_HEADER
    deltaheadersize = struct.calcsize(deltaheader)
    _grouplistcount = 2 # One list of manifests and one list of files

    def _deltaheader(self, headertuple, prevnode):
        """Return the six cg3 header fields as a tuple, flags included."""
        node, parent1, parent2, base, linknode, revflags = headertuple
        return node, parent1, parent2, base, linknode, revflags

    def _unpackmanifests(self, repo, revmap, trp, prog, numchanges):
        """Apply the root manifest group, then any directory manifests.

        After the inherited processing, groups are read until
        filelogheader() returns something false; each group read is
        added to the dirlog named by its "filename" entry.
        """
        parent = super(cg3unpacker, self)
        parent._unpackmanifests(repo, revmap, trp, prog, numchanges)
        header = self.filelogheader()
        while header:
            # Reaching this point means the changegroup carries
            # directory manifests
            dirname = header["filename"]
            repo.ui.debug("adding %s revisions\n" % dirname)
            added = repo.manifest.dirlog(dirname).addgroup(self, revmap, trp)
            if not added:
                raise error.Abort(_("received dir revlog group is empty"))
            header = self.filelogheader()

543

544

class headerlessfixup(object):
    """File-like reader that serves saved header bytes before the stream.

    h holds bytes to hand out first; once they are exhausted, reads are
    satisfied from fh through readexactly().
    """
    def __init__(self, fh, h):
        self._fh = fh
        self._h = h

    def read(self, n):
        """Return n bytes, draining the saved header first."""
        if not self._h:
            return readexactly(self._fh, n)
        data = self._h[:n]
        self._h = self._h[n:]
        shortfall = n - len(data)
        if shortfall > 0:
            # the header ran out mid-read; top up from the real stream
            data += readexactly(self._fh, shortfall)
        return data

555

556

def _moddirs(files):

556

def _moddirs(files):

557

"""Given a set of modified files, find the list of modified directories.

557

"""Given a set of modified files, find the list of modified directories.

558

559

This returns a list of (path to changed dir, changed dir) tuples,

559

This returns a list of (path to changed dir, changed dir) tuples,

560

as that's what the one client needs anyway.

560

as that's what the one client needs anyway.

561

562

>>> _moddirs(['a/b/c.py', 'a/b/c.txt', 'a/d/e/f/g.txt', 'i.txt', ])

562

>>> _moddirs(['a/b/c.py', 'a/b/c.txt', 'a/d/e/f/g.txt', 'i.txt', ])

563

[('/', 'a/'), ('a/', 'b/'), ('a/', 'd/'), ('a/d/', 'e/'), ('a/d/e/', 'f/')]

563

[('/', 'a/'), ('a/', 'b/'), ('a/', 'd/'), ('a/d/', 'e/'), ('a/d/e/', 'f/')]

564

565

"""

565

"""

566

alldirs = set()

566

alldirs = set()

567

for f in files:

567

for f in files:

568

path = f.split('/')[:-1]

568

path = f.split('/')[:-1]

569

for i in xrange(len(path) - 1, -1, -1):

569

for i in xrange(len(path) - 1, -1, -1):

570

dn = '/'.join(path[:i])

570

dn = '/'.join(path[:i])

571

current = dn + '/', path[i] + '/'

571

current = dn + '/', path[i] + '/'

572

if current in alldirs:

572

if current in alldirs:

573

break

573

break

574

alldirs.add(current)

574

alldirs.add(current)

575

return sorted(alldirs)

575

return sorted(alldirs)

576

577

class cg1packer(object):
    """Generator of version '01' changegroup streams.

    Subclasses override deltaheader/version and the small hook methods
    (deltaparent, builddeltaheader, _packmanifests, _manifestsdone) to
    produce the newer stream formats.
    """
    deltaheader = _CHANGEGROUPV1_DELTA_HEADER
    version = '01'
    def __init__(self, repo, bundlecaps=None):
        """Given a source repo, construct a bundler.

        bundlecaps is optional and can be used to specify the set of
        capabilities which can be used to build the bundle.
        """
        # Set of capabilities we can use to build the bundle.
        if bundlecaps is None:
            bundlecaps = set()
        self._bundlecaps = bundlecaps
        # experimental config: bundle.reorder
        reorder = repo.ui.config('bundle', 'reorder', 'auto')
        if reorder == 'auto':
            # None means "decide per revlog" (see group())
            reorder = None
        else:
            reorder = util.parsebool(reorder)
        self._repo = repo
        self._reorder = reorder
        self._progress = repo.ui.progress
        # per-section size notes are shown for --verbose but not --debug
        if self._repo.ui.verbose and not self._repo.ui.debugflag:
            self._verbosenote = self._repo.ui.note
        else:
            self._verbosenote = lambda s: None

    def close(self):
        """Return the chunk used to terminate a group (see closechunk)."""
        return closechunk()

    def fileheader(self, fname):
        """Return the chunk announcing the group for fname."""
        return chunkheader(len(fname)) + fname

    def group(self, nodelist, revlog, lookup, units=None):
        """Calculate a delta group, yielding a sequence of changegroup chunks
        (strings).

        Given a list of changeset revs, return a set of deltas and
        metadata corresponding to nodes. The first delta is
        first parent(nodelist[0]) -> nodelist[0], the receiver is
        guaranteed to have this parent as it has all history before
        these changesets. In the case firstparent is nullrev the
        changegroup starts with a full revision.

        If units is not None, progress detail will be generated, units specifies
        the type of revlog that is touched (changelog, manifest, etc.).

        lookup is called with each node, in emission order, and must
        return the linknode to record for it.
        """
        # if we don't have any revisions touched by these changesets, bail
        if len(nodelist) == 0:
            yield self.close()
            return

        # for generaldelta revlogs, we linearize the revs; this will both be
        # much quicker and generate a much smaller bundle
        if (revlog._generaldelta and self._reorder is None) or self._reorder:
            dag = dagutil.revlogdag(revlog)
            revs = set(revlog.rev(n) for n in nodelist)
            revs = dag.linearize(revs)
        else:
            revs = sorted([revlog.rev(n) for n in nodelist])

        # add the parent of the first rev
        p = revlog.parentrevs(revs[0])[0]
        revs.insert(0, p)

        # build deltas
        total = len(revs) - 1
        msgbundling = _('bundling')
        for r in xrange(len(revs) - 1):
            if units is not None:
                self._progress(msgbundling, r + 1, unit=units, total=total)
            prev, curr = revs[r], revs[r + 1]
            linknode = lookup(revlog.node(curr))
            for c in self.revchunk(revlog, curr, prev, linknode):
                yield c

        if units is not None:
            self._progress(msgbundling, None)
        yield self.close()

    # filter any nodes that claim to be part of the known set
    def prune(self, revlog, missing, commonrevs):
        """Return the nodes of missing whose linkrev is not in commonrevs."""
        rr, rl = revlog.rev, revlog.linkrev
        return [n for n in missing if rl(rr(n)) not in commonrevs]

    def _packmanifests(self, dir, mfnodes, lookuplinknode):
        """Pack flat manifests into a changegroup stream."""
        # this format only carries the root manifest
        assert not dir
        for chunk in self.group(mfnodes, self._repo.manifest,
                                lookuplinknode, units=_('manifests')):
            yield chunk

    def _manifestsdone(self):
        """Return the data emitted after all manifests (nothing here)."""
        return ''

    def generate(self, commonrevs, clnodes, fastpathlinkrev, source):
        '''yield a sequence of changegroup chunks (strings)

        Chunks are produced in order: changelog group, manifests, file
        groups, then a final close chunk. If clnodes is non-empty the
        'outgoing' hook is run after that last chunk has been consumed.
        '''
        repo = self._repo
        cl = repo.changelog

        clrevorder = {}
        mfs = {} # needed manifests
        fnodes = {} # needed file nodes
        # maps manifest node id -> set(changed files)
        mfchangedfiles = {}

        # Callback for the changelog, used to collect changed files and manifest
        # nodes.
        # Returns the linkrev node (identity in the changelog case).
        def lookupcl(x):
            c = cl.read(x)
            clrevorder[x] = len(clrevorder)
            n = c[0]
            # record the first changeset introducing this manifest version
            mfs.setdefault(n, x)
            # Record a complete list of potentially-changed files in
            # this manifest.
            mfchangedfiles.setdefault(n, set()).update(c[3])
            return x

        self._verbosenote(_('uncompressed size of bundle content:\n'))
        size = 0
        for chunk in self.group(clnodes, cl, lookupcl, units=_('changesets')):
            size += len(chunk)
            yield chunk
        self._verbosenote(_('%8.i (changelog)\n') % size)

        # We need to make sure that the linkrev in the changegroup refers to
        # the first changeset that introduced the manifest or file revision.
        # The fastpath is usually safer than the slowpath, because the filelogs
        # are walked in revlog order.
        #
        # When taking the slowpath with reorder=None and the manifest revlog
        # uses generaldelta, the manifest may be walked in the "wrong" order.
        # Without 'clrevorder', we would get an incorrect linkrev (see fix in
        # cc0ff93d0c0c).
        #
        # When taking the fastpath, we are only vulnerable to reordering
        # of the changelog itself. The changelog never uses generaldelta, so
        # it is only reordered when reorder=True. To handle this case, we
        # simply take the slowpath, which already has the 'clrevorder' logic.
        # This was also fixed in cc0ff93d0c0c.
        fastpathlinkrev = fastpathlinkrev and not self._reorder
        # Treemanifests don't work correctly with fastpathlinkrev
        # either, because we don't discover which directory nodes to
        # send along with files. This could probably be fixed.
        fastpathlinkrev = fastpathlinkrev and (
                'treemanifest' not in repo.requirements)

        for chunk in self.generatemanifests(commonrevs, clrevorder,
                fastpathlinkrev, mfs, mfchangedfiles, fnodes):
            yield chunk
        mfs.clear()
        clrevs = set(cl.rev(x) for x in clnodes)

        if not fastpathlinkrev:
            # slowpath: linknodes were collected while sending manifests
            def linknodes(unused, fname):
                return fnodes.get(fname, {})
        else:
            cln = cl.node
            # fastpath: trust the linkrevs stored in the filelog itself
            def linknodes(filerevlog, fname):
                llr = filerevlog.linkrev
                fln = filerevlog.node
                revs = ((r, llr(r)) for r in filerevlog)
                return dict((fln(r), cln(lr)) for r, lr in revs if lr in clrevs)

        changedfiles = set()
        for x in mfchangedfiles.itervalues():
            changedfiles.update(x)
        for chunk in self.generatefiles(changedfiles, linknodes, commonrevs,
                                        source):
            yield chunk

        yield self.close()

        if clnodes:
            repo.hook('outgoing', node=hex(clnodes[0]), source=source)

    def generatemanifests(self, commonrevs, clrevorder, fastpathlinkrev, mfs,
                          mfchangedfiles, fnodes):
        """Yield the manifest chunks, followed by self._manifestsdone().

        mfs maps each needed manifest node to its changelog node. As a
        side effect of sending manifests on the slowpath, fnodes is
        filled with {filename: {filenode: linknode}}.
        """
        repo = self._repo
        ml = repo.manifest
        # directory -> {manifest node: changelog node}; '' is the root.
        # lookupmflinknode adds subdirectories while the root is sent.
        tmfnodes = {'': mfs}

        # Callback for the manifest, used to collect linkrevs for filelog
        # revisions.
        # Returns the linkrev node (collected in lookupcl).
        def makelookupmflinknode(dir):
            if fastpathlinkrev:
                assert not dir
                return mfs.__getitem__

            if dir:
                return tmfnodes[dir].get

            def lookupmflinknode(x):
                """Callback for looking up the linknode for manifests.

                Returns the linkrev node for the specified manifest.

                SIDE EFFECT:

                1) fclnodes gets populated with the list of relevant
                   file nodes if we're not using fastpathlinkrev
                2) When treemanifests are in use, collects treemanifest nodes
                   to send

                Note that this means manifests must be completely sent to
                the client before you can trust the list of files and
                treemanifests to send.
                """
                clnode = mfs[x]
                # We no longer actually care about reading deltas of
                # the manifest here, because we already know the list
                # of changed files, so for treemanifests (which
                # lazily-load anyway to *generate* a readdelta) we can
                # just load them with read() and then we'll actually
                # be able to correctly load node IDs from the
                # submanifest entries.
                if 'treemanifest' in repo.requirements:
                    mdata = ml.read(x)
                else:
                    mdata = ml.readfast(x)
                for f in mfchangedfiles[x]:
                    try:
                        n = mdata[f]
                    except KeyError:
                        continue
                    # record the first changeset introducing this filelog
                    # version
                    fclnodes = fnodes.setdefault(f, {})
                    fclnode = fclnodes.setdefault(n, clnode)
                    if clrevorder[clnode] < clrevorder[fclnode]:
                        fclnodes[n] = clnode
                # gather list of changed treemanifest nodes
                if 'treemanifest' in repo.requirements:
                    submfs = {'/': mdata}
                    for dn, bn in _moddirs(mfchangedfiles[x]):
                        try:
                            submf = submfs[dn]
                            submf = submf._dirs[bn]
                        except KeyError:
                            continue # deleted directory, so nothing to send
                        submfs[submf.dir()] = submf
                        tmfclnodes = tmfnodes.setdefault(submf.dir(), {})
                        tmfclnode = tmfclnodes.setdefault(submf._node, clnode)
                        if clrevorder[clnode] < clrevorder[tmfclnode]:
                            # Key on the submanifest node. 'n' is the
                            # file node left over from the loop above
                            # (unbound if no changed file was found in
                            # this manifest), so using it here recorded
                            # the earlier changeset under the wrong key.
                            tmfclnodes[submf._node] = clnode
                return clnode
            return lookupmflinknode

        size = 0
        while tmfnodes:
            # tmfnodes can grow while a directory is being sent, so pick
            # the next directory afresh on every pass
            dir = min(tmfnodes)
            nodes = tmfnodes[dir]
            prunednodes = self.prune(ml.dirlog(dir), nodes, commonrevs)
            for x in self._packmanifests(dir, prunednodes,
                                         makelookupmflinknode(dir)):
                size += len(x)
                yield x
            del tmfnodes[dir]
        self._verbosenote(_('%8.i (manifests)\n') % size)
        yield self._manifestsdone()

    # The 'source' parameter is useful for extensions
    def generatefiles(self, changedfiles, linknodes, commonrevs, source):
        """Yield a header plus delta group for each file with data to send.

        linknodes(filerevlog, fname) must return {filenode: linknode}.
        Files with nothing left after pruning are skipped. Raises
        error.Abort if a changed file has an empty or missing revlog.
        """
        repo = self._repo
        progress = self._progress
        msgbundling = _('bundling')

        total = len(changedfiles)
        # for progress output
        msgfiles = _('files')
        for i, fname in enumerate(sorted(changedfiles)):
            filerevlog = repo.file(fname)
            if not filerevlog:
                raise error.Abort(_("empty or missing revlog for %s") % fname)

            linkrevnodes = linknodes(filerevlog, fname)
            # Lookup for filenodes, we collected the linkrev nodes above in the
            # fastpath case and with lookupmf in the slowpath case.
            def lookupfilelog(x):
                return linkrevnodes[x]

            filenodes = self.prune(filerevlog, linkrevnodes, commonrevs)
            if filenodes:
                progress(msgbundling, i + 1, item=fname, unit=msgfiles,
                         total=total)
                h = self.fileheader(fname)
                size = len(h)
                yield h
                for chunk in self.group(filenodes, filerevlog, lookupfilelog):
                    size += len(chunk)
                    yield chunk
                self._verbosenote(_('%8.i %s\n') % (size, fname))
        progress(msgbundling, None)

    def deltaparent(self, revlog, rev, p1, p2, prev):
        """Return the rev to delta against: always the previous one here."""
        return prev

    def revchunk(self, revlog, rev, prev, linknode):
        """Yield the chunk header, delta header and delta for one revision.

        A full text is sent, behind a synthetic diff header, when the
        delta base is nullrev or when the base or the revision itself is
        censored.
        """
        node = revlog.node(rev)
        p1, p2 = revlog.parentrevs(rev)
        base = self.deltaparent(revlog, rev, p1, p2, prev)

        prefix = ''
        if revlog.iscensored(base) or revlog.iscensored(rev):
            try:
                delta = revlog.revision(node)
            except error.CensoredNodeError as e:
                delta = e.tombstone
            if base == nullrev:
                prefix = mdiff.trivialdiffheader(len(delta))
            else:
                baselen = revlog.rawsize(base)
                prefix = mdiff.replacediffheader(baselen, len(delta))
        elif base == nullrev:
            delta = revlog.revision(node)
            prefix = mdiff.trivialdiffheader(len(delta))
        else:
            delta = revlog.revdiff(base, rev)
        p1n, p2n = revlog.parents(node)
        basenode = revlog.node(base)
        flags = revlog.flags(rev)
        meta = self.builddeltaheader(node, p1n, p2n, basenode, linknode, flags)
        meta += prefix
        l = len(meta) + len(delta)
        yield chunkheader(l)
        yield meta
        yield delta

    def builddeltaheader(self, node, p1n, p2n, basenode, linknode, flags):
        """Pack the delta header for one revision (cg1 layout)."""
        # do nothing with basenode, it is implicitly the previous one in HG10
        # do nothing with flags, it is implicitly 0 for cg1 and cg2
        return struct.pack(self.deltaheader, node, p1n, p2n, linknode)

912

911

913

class cg2packer(cg1packer):
    """Generator of version '02' changegroup streams.

    Differs from cg1 in that the delta base is written into every delta
    header, so deltas need not be against the previous revision sent.
    """
    deltaheader = _CHANGEGROUPV2_DELTA_HEADER
    version = '02'

    def __init__(self, repo, bundlecaps=None):
        """Construct the bundler; bundle.reorder=auto means no reordering."""
        super(cg2packer, self).__init__(repo, bundlecaps)
        # cg2 supports generaldelta natively, so reordering rarely
        # helps: treat bundle.reorder=auto like bundle.reorder=False.
        if self._reorder is None:
            self._reorder = False

    def deltaparent(self, revlog, rev, p1, p2, prev):
        """Return the stored delta parent when the receiver must have it.

        Falls back to prev when the revision is stored as a full text
        (delta parent is nullrev) or when the stored base is none of
        p1, p2 and prev, since the remote may then lack it.
        """
        stored = revlog.deltaparent(rev)
        if stored != nullrev and stored in (p1, p2, prev):
            return stored
        return prev

    def builddeltaheader(self, node, p1n, p2n, basenode, linknode, flags):
        """Pack the delta header for one revision (cg2 layout)."""
        # flags are not transmitted; they are implicitly 0 in cg1 and cg2
        fields = (node, p1n, p2n, basenode, linknode)
        return struct.pack(self.deltaheader, *fields)

936

935

937

class cg3packer(cg2packer):
    """Generator of version '03' changegroup streams.

    Adds per-directory manifest groups and a flags field in the delta
    header on top of cg2.
    """
    deltaheader = _CHANGEGROUPV3_DELTA_HEADER
    version = '03'

    def _packmanifests(self, dir, mfnodes, lookuplinknode):
        """Yield the manifest group for dir.

        A non-root directory group is preceded by a file header naming
        the directory; the root ('') group has no such header.
        """
        if dir:
            yield self.fileheader(dir)
        chunks = self.group(mfnodes, self._repo.manifest.dirlog(dir),
                            lookuplinknode, units=_('manifests'))
        for piece in chunks:
            yield piece

    def _manifestsdone(self):
        """Return the close chunk that ends the manifests section."""
        return self.close()

    def builddeltaheader(self, node, p1n, p2n, basenode, linknode, flags):
        """Pack the delta header for one revision (cg3 layout, with flags)."""
        fields = (node, p1n, p2n, basenode, linknode, flags)
        return struct.pack(self.deltaheader, *fields)

954

953

955

_packermap = {'01': (cg1packer, cg1unpacker),

954

_packermap = {'01': (cg1packer, cg1unpacker),

956

# cg2 adds support for exchanging generaldelta

955

# cg2 adds support for exchanging generaldelta

957

'02': (cg2packer, cg2unpacker),

956

'02': (cg2packer, cg2unpacker),

958

# cg3 adds support for exchanging revlog flags and treemanifests

957

# cg3 adds support for exchanging revlog flags and treemanifests

959

'03': (cg3packer, cg3unpacker),

958

'03': (cg3packer, cg3unpacker),

960

}

959

}

961

960

962

def allsupportedversions(ui):

961

def allsupportedversions(ui):

963

versions = set(_packermap.keys())

962

versions = set(_packermap.keys())

964

versions.discard('03')

963

versions.discard('03')

965

if (ui.configbool('experimental', 'changegroup3') or

964

if (ui.configbool('experimental', 'changegroup3') or

966

ui.configbool('experimental', 'treemanifest')):

965

ui.configbool('experimental', 'treemanifest')):

967

versions.add('03')

966

versions.add('03')

968

return versions

967

return versions

969

968

970

# Changegroup versions that can be applied to the repo

969

# Changegroup versions that can be applied to the repo

971

def supportedincomingversions(repo):

970

def supportedincomingversions(repo):

972

versions = allsupportedversions(repo.ui)

971

versions = allsupportedversions(repo.ui)

973

if 'treemanifest' in repo.requirements:

972

if 'treemanifest' in repo.requirements:

974

versions.add('03')

973

versions.add('03')

975

return versions

974

return versions

976

975

977

# Changegroup versions that can be created from the repo

976

# Changegroup versions that can be created from the repo

978

def supportedoutgoingversions(repo):

977

def supportedoutgoingversions(repo):

979

versions = allsupportedversions(repo.ui)

978

versions = allsupportedversions(repo.ui)

980

if 'treemanifest' in repo.requirements:

979

if 'treemanifest' in repo.requirements:

981

# Versions 01 and 02 support only flat manifests and it's just too

980

# Versions 01 and 02 support only flat manifests and it's just too

982

# expensive to convert between the flat manifest and tree manifest on

981

# expensive to convert between the flat manifest and tree manifest on

983

# the fly. Since tree manifests are hashed differently, all of history

982

# the fly. Since tree manifests are hashed differently, all of history

984

# would have to be converted. Instead, we simply don't even pretend to

983

# would have to be converted. Instead, we simply don't even pretend to

985

# support versions 01 and 02.

984

# support versions 01 and 02.

986

versions.discard('01')

985

versions.discard('01')

987

versions.discard('02')

986

versions.discard('02')

988

versions.add('03')

987

versions.add('03')

989

return versions

988

return versions

990

989

991

def safeversion(repo):

990

def safeversion(repo):

992

# Finds the smallest version that it's safe to assume clients of the repo

991

# Finds the smallest version that it's safe to assume clients of the repo

993

# will support. For example, all hg versions that support generaldelta also

992

# will support. For example, all hg versions that support generaldelta also

994

# support changegroup 02.

993

# support changegroup 02.

995

versions = supportedoutgoingversions(repo)

994

versions = supportedoutgoingversions(repo)

996

if 'generaldelta' in repo.requirements:

995

if 'generaldelta' in repo.requirements:

997

versions.discard('01')

996

versions.discard('01')

998

assert versions

997

assert versions

999

return min(versions)

998

return min(versions)

1000

999

1001

def getbundler(version, repo, bundlecaps=None):

1000

def getbundler(version, repo, bundlecaps=None):

1002

assert version in supportedoutgoingversions(repo)

1001

assert version in supportedoutgoingversions(repo)

1003

return _packermap[version][0](repo, bundlecaps)

1002

return _packermap[version][0](repo, bundlecaps)

1004

1003

1005

def getunbundler(version, fh, alg):

1004

def getunbundler(version, fh, alg):

1006

return _packermap[version][1](fh, alg)

1005

return _packermap[version][1](fh, alg)

1007

1006

1008

def _changegroupinfo(repo, nodes, source):

1007

def _changegroupinfo(repo, nodes, source):

1009

if repo.ui.verbose or source == 'bundle':

1008

if repo.ui.verbose or source == 'bundle':

1010

repo.ui.status(_("%d changesets found\n") % len(nodes))

1009

repo.ui.status(_("%d changesets found\n") % len(nodes))

1011

if repo.ui.debugflag:

1010

if repo.ui.debugflag:

1012

repo.ui.debug("list of changesets:\n")

1011

repo.ui.debug("list of changesets:\n")

1013

for node in nodes:

1012

for node in nodes:

1014

repo.ui.debug("%s\n" % hex(node))

1013

repo.ui.debug("%s\n" % hex(node))

1015

1014

1016

def getsubsetraw(repo, outgoing, bundler, source, fastpath=False):

1015

def getsubsetraw(repo, outgoing, bundler, source, fastpath=False):

1017

repo = repo.unfiltered()

1016

repo = repo.unfiltered()

1018

commonrevs = outgoing.common

1017

commonrevs = outgoing.common

1019

csets = outgoing.missing

1018

csets = outgoing.missing

1020

heads = outgoing.missingheads

1019

heads = outgoing.missingheads

1021

# We go through the fast path if we get told to, or if all (unfiltered

1020

# We go through the fast path if we get told to, or if all (unfiltered

1022

# heads have been requested (since we then know there all linkrevs will

1021

# heads have been requested (since we then know there all linkrevs will

1023

# be pulled by the client).

1022

# be pulled by the client).

1024

heads.sort()

1023

heads.sort()

1025

fastpathlinkrev = fastpath or (

1024

fastpathlinkrev = fastpath or (

1026

repo.filtername is None and heads == sorted(repo.heads()))

1025

repo.filtername is None and heads == sorted(repo.heads()))

1027

1026

1028

repo.hook('preoutgoing', throw=True, source=source)

1027

repo.hook('preoutgoing', throw=True, source=source)

1029

_changegroupinfo(repo, csets, source)

1028

_changegroupinfo(repo, csets, source)

1030

return bundler.generate(commonrevs, csets, fastpathlinkrev, source)

1029

return bundler.generate(commonrevs, csets, fastpathlinkrev, source)

1031

1030

1032

def getsubset(repo, outgoing, bundler, source, fastpath=False):

1031

def getsubset(repo, outgoing, bundler, source, fastpath=False):

1033

gengroup = getsubsetraw(repo, outgoing, bundler, source, fastpath)

1032

gengroup = getsubsetraw(repo, outgoing, bundler, source, fastpath)

1034

return getunbundler(bundler.version, util.chunkbuffer(gengroup), None)

1033

return getunbundler(bundler.version, util.chunkbuffer(gengroup), None)

1035

1034

1036

def changegroupsubset(repo, roots, heads, source, version='01'):

1035

def changegroupsubset(repo, roots, heads, source, version='01'):

1037

"""Compute a changegroup consisting of all the nodes that are

1036

"""Compute a changegroup consisting of all the nodes that are

1038

descendants of any of the roots and ancestors of any of the heads.

1037

descendants of any of the roots and ancestors of any of the heads.

1039

Return a chunkbuffer object whose read() method will return

1038

Return a chunkbuffer object whose read() method will return

1040

successive changegroup chunks.

1039

successive changegroup chunks.

1041

1040

1042

It is fairly complex as determining which filenodes and which

1041

It is fairly complex as determining which filenodes and which

1043

manifest nodes need to be included for the changeset to be complete

1042

manifest nodes need to be included for the changeset to be complete

1044

is non-trivial.

1043

is non-trivial.

1045

1044

1046

Another wrinkle is doing the reverse, figuring out which changeset in

1045

Another wrinkle is doing the reverse, figuring out which changeset in

1047

the changegroup a particular filenode or manifestnode belongs to.

1046

the changegroup a particular filenode or manifestnode belongs to.

1048

"""

1047

"""

1049

cl = repo.changelog

1048

cl = repo.changelog

1050

if not roots:

1049

if not roots:

1051

roots = [nullid]

1050

roots = [nullid]

1052

discbases = []

1051

discbases = []

1053

for n in roots:

1052

for n in roots:

1054

discbases.extend([p for p in cl.parents(n) if p != nullid])

1053

discbases.extend([p for p in cl.parents(n) if p != nullid])

1055

# TODO: remove call to nodesbetween.

1054

# TODO: remove call to nodesbetween.

1056

csets, roots, heads = cl.nodesbetween(roots, heads)

1055

csets, roots, heads = cl.nodesbetween(roots, heads)

1057

included = set(csets)

1056

included = set(csets)

1058

discbases = [n for n in discbases if n not in included]

1057

discbases = [n for n in discbases if n not in included]

1059

outgoing = discovery.outgoing(cl, discbases, heads)

1058

outgoing = discovery.outgoing(cl, discbases, heads)

1060

bundler = getbundler(version, repo)

1059

bundler = getbundler(version, repo)

1061

return getsubset(repo, outgoing, bundler, source)

1060

return getsubset(repo, outgoing, bundler, source)

1062

1061

1063

def getlocalchangegroupraw(repo, source, outgoing, bundlecaps=None,

1062

def getlocalchangegroupraw(repo, source, outgoing, bundlecaps=None,

1064

version='01'):

1063

version='01'):

1065

"""Like getbundle, but taking a discovery.outgoing as an argument.

1064

"""Like getbundle, but taking a discovery.outgoing as an argument.

1066

1065

1067

This is only implemented for local repos and reuses potentially

1066

This is only implemented for local repos and reuses potentially

1068

precomputed sets in outgoing. Returns a raw changegroup generator."""

1067

precomputed sets in outgoing. Returns a raw changegroup generator."""

1069

if not outgoing.missing:

1068

if not outgoing.missing:

1070

return None

1069

return None

1071

bundler = getbundler(version, repo, bundlecaps)

1070

bundler = getbundler(version, repo, bundlecaps)

1072

return getsubsetraw(repo, outgoing, bundler, source)

1071

return getsubsetraw(repo, outgoing, bundler, source)

1073

1072

1074

def getlocalchangegroup(repo, source, outgoing, bundlecaps=None,

1073

def getlocalchangegroup(repo, source, outgoing, bundlecaps=None,

1075

version='01'):

1074

version='01'):

1076

"""Like getbundle, but taking a discovery.outgoing as an argument.

1075

"""Like getbundle, but taking a discovery.outgoing as an argument.

1077

1076

1078

This is only implemented for local repos and reuses potentially

1077

This is only implemented for local repos and reuses potentially

1079

precomputed sets in outgoing."""

1078

precomputed sets in outgoing."""

1080

if not outgoing.missing:

1079

if not outgoing.missing:

1081

return None

1080

return None

1082

bundler = getbundler(version, repo, bundlecaps)

1081

bundler = getbundler(version, repo, bundlecaps)

1083

return getsubset(repo, outgoing, bundler, source)

1082

return getsubset(repo, outgoing, bundler, source)

1084

1083

1085

def computeoutgoing(repo, heads, common):

1084

def computeoutgoing(repo, heads, common):

1086

"""Computes which revs are outgoing given a set of common

1085

"""Computes which revs are outgoing given a set of common

1087

and a set of heads.

1086

and a set of heads.

1088

1087

1089

This is a separate function so extensions can have access to

1088

This is a separate function so extensions can have access to

1090

the logic.

1089

the logic.

1091

1090

1092

Returns a discovery.outgoing object.

1091

Returns a discovery.outgoing object.

1093

"""

1092

"""

1094

cl = repo.changelog

1093

cl = repo.changelog

1095

if common:

1094

if common:

1096

hasnode = cl.hasnode

1095

hasnode = cl.hasnode

1097

common = [n for n in common if hasnode(n)]

1096

common = [n for n in common if hasnode(n)]

1098

else:

1097

else:

1099

common = [nullid]

1098

common = [nullid]

1100

if not heads:

1099

if not heads:

1101

heads = cl.heads()

1100

heads = cl.heads()

1102

return discovery.outgoing(cl, common, heads)

1101

return discovery.outgoing(cl, common, heads)

1103

1102

1104

def getchangegroup(repo, source, heads=None, common=None, bundlecaps=None,

1103

def getchangegroup(repo, source, heads=None, common=None, bundlecaps=None,

1105

version='01'):

1104

version='01'):

1106

"""Like changegroupsubset, but returns the set difference between the

1105

"""Like changegroupsubset, but returns the set difference between the

1107

ancestors of heads and the ancestors common.

1106

ancestors of heads and the ancestors common.

1108

1107

1109

If heads is None, use the local heads. If common is None, use [nullid].

1108

If heads is None, use the local heads. If common is None, use [nullid].

1110

1109

1111

The nodes in common might not all be known locally due to the way the

1110

The nodes in common might not all be known locally due to the way the

1112

current discovery protocol works.

1111

current discovery protocol works.

1113

"""

1112

"""

1114

outgoing = computeoutgoing(repo, heads, common)

1113

outgoing = computeoutgoing(repo, heads, common)

1115

return getlocalchangegroup(repo, source, outgoing, bundlecaps=bundlecaps,

1114

return getlocalchangegroup(repo, source, outgoing, bundlecaps=bundlecaps,

1116

version=version)

1115

version=version)

1117

1116

1118

def changegroup(repo, basenodes, source):

1117

def changegroup(repo, basenodes, source):

1119

# to avoid a race we use changegroupsubset() (issue1320)

1118

# to avoid a race we use changegroupsubset() (issue1320)

1120

return changegroupsubset(repo, basenodes, repo.heads(), source)

1119

return changegroupsubset(repo, basenodes, repo.heads(), source)

1121

1120

1122

def _addchangegroupfiles(repo, source, revmap, trp, pr, needfiles):

1121

def _addchangegroupfiles(repo, source, revmap, trp, pr, needfiles):

1123

revisions = 0

1122

revisions = 0

1124

files = 0

1123

files = 0

1125

while True:

1124

while True:

1126

chunkdata = source.filelogheader()

1125

chunkdata = source.filelogheader()

1127

if not chunkdata:

1126

if not chunkdata:

1128

break

1127

break

1129

f = chunkdata["filename"]

1128

f = chunkdata["filename"]

1130

repo.ui.debug("adding %s revisions\n" % f)

1129

repo.ui.debug("adding %s revisions\n" % f)

1131

pr()

1130

pr()

1132

fl = repo.file(f)

1131

fl = repo.file(f)

1133

o = len(fl)

1132

o = len(fl)

1134

try:

1133

try:

1135

if not fl.addgroup(source, revmap, trp):

1134

if not fl.addgroup(source, revmap, trp):

1136

raise error.Abort(_("received file revlog group is empty"))

1135

raise error.Abort(_("received file revlog group is empty"))

1137

except error.CensoredBaseError as e:

1136

except error.CensoredBaseError as e:

1138

raise error.Abort(_("received delta base is censored: %s") % e)

1137

raise error.Abort(_("received delta base is censored: %s") % e)

1139

revisions += len(fl) - o

1138

revisions += len(fl) - o

1140

files += 1

1139

files += 1

1141

if f in needfiles:

1140

if f in needfiles:

1142

needs = needfiles[f]

1141

needs = needfiles[f]

1143

for new in xrange(o, len(fl)):

1142

for new in xrange(o, len(fl)):

1144

n = fl.node(new)

1143

n = fl.node(new)

1145

if n in needs:

1144

if n in needs:

1146

needs.remove(n)

1145

needs.remove(n)

1147

else:

1146

else:

1148

raise error.Abort(

1147

raise error.Abort(

1149

_("received spurious file revlog entry"))

1148

_("received spurious file revlog entry"))

1150

if not needs:

1149

if not needs:

1151

del needfiles[f]

1150

del needfiles[f]

1152

repo.ui.progress(_('files'), None)

1151

repo.ui.progress(_('files'), None)

1153

1152

1154

for f, needs in needfiles.iteritems():

1153

for f, needs in needfiles.iteritems():

1155

fl = repo.file(f)

1154

fl = repo.file(f)

1156

for n in needs:

1155

for n in needs:

1157

try:

1156

try:

1158

fl.rev(n)

1157

fl.rev(n)

1159

except error.LookupError:

1158

except error.LookupError:

1160

raise error.Abort(

1159

raise error.Abort(

1161

_('missing file data for %s:%s - run hg verify') %

1160

_('missing file data for %s:%s - run hg verify') %

1162

(f, hex(n)))

1161

(f, hex(n)))

1163

1162

1164

return revisions, files

1163

return revisions, files

	Site-wide shortcuts
/	Use quick search box
g h	Goto home page
g g	Goto my private gists page
g G	Goto my public gists page
g 0-9	Goto bookmarked items from 0-9
n r	New repository page
n g	New gist page

	Repositories
g s	Goto summary page
g c	Goto changelog page
g f	Goto files page
g F	Goto files page with file search activated
g p	Goto pull requests page
g o	Goto repository settings
g O	Goto repository access permissions settings
t s	Toggle sidebar on some pages

             # changegroup.py - Mercurial changegroup manipulation functions
             #
             #  Copyright 2006 Matt Mackall <mpm@selenic.com>
             #
             # This software may be used and distributed according to the terms of the
             # GNU General Public License version 2 or any later version.
             from __future__ import absolute_import
             import os
             import struct
             import tempfile
             import weakref
             from .i18n import _
             from .node import (
                 hex,
                 nullid,
                 nullrev,
                 short,
             )
             from . import (
                 branchmap,
                 dagutil,
                 discovery,
                 error,
                 mdiff,
                 phases,
                 util,
             )
             # struct formats of the per-revision delta header for each changegroup
             # version. Every "20s" field is a 20-byte binary node.
             # v1: node, p1, p2, link node ('cs'); the delta base is not transmitted
             # and is derived by the unpacker from the previous node (or p1).
             _CHANGEGROUPV1_DELTA_HEADER = "20s20s20s20s"
             # v2: node, p1, p2, explicit delta base, link node.
             _CHANGEGROUPV2_DELTA_HEADER = "20s20s20s20s20s"
             # v3: the v2 fields followed by an unsigned 16-bit flags field ("H");
             # the leading ">" selects big-endian, unpadded packing.
             _CHANGEGROUPV3_DELTA_HEADER = ">20s20s20s20s20sH"
             def readexactly(stream, n):
                 '''return the result of stream.read(n), aborting on a short read

                 Raises error.Abort when fewer than n bytes come back.
                 '''
                 data = stream.read(n)
                 received = len(data)
                 if received >= n:
                     return data
                 # a short read means the stream was cut off mid-record
                 raise error.Abort(_("stream ended unexpectedly"
                                     " (got %d bytes, expected %d)")
                                   % (received, n))
             def getchunk(stream):
                 """read one length-prefixed chunk from stream and return its payload

                 The 4-byte big-endian length counts itself, so a length of 0 marks an
                 empty chunk (returned as "") and lengths 1..4 (or negative) are
                 rejected with error.Abort.
                 """
                 prefix = readexactly(stream, 4)
                 (length,) = struct.unpack(">l", prefix)
                 if length > 4:
                     return readexactly(stream, length - 4)
                 if length:
                     raise error.Abort(_("invalid chunk length %d") % length)
                 return ""
             def chunkheader(length):
                 """build the 4-byte length prefix for a chunk carrying length bytes"""
                 # the encoded length includes the 4 bytes of the prefix itself
                 framed = length + 4
                 return struct.pack(">l", framed)
             def closechunk():
                 """build the length prefix of a zero-length chunk (a packed 0)"""
                 terminator = struct.pack(">l", 0)
                 return terminator
             def combineresults(results):
                 """logic to combine 0 or more addchangegroup results into one

                 Each entry follows the integer convention documented on apply():
                 0 means nothing changed, 1 means the head count is unchanged,
                 1+n means n heads were added and -1-n means n heads were removed.

                 Returns 0 as soon as any entry is 0; otherwise the net head change
                 re-encoded in the same convention (1 when there is no net change or
                 no results at all).
                 """
                 changedheads = 0
                 for ret in results:
                     # If any changegroup result is 0, return 0. Returning right away
                     # keeps head changes accumulated from earlier entries from
                     # overriding the 0.
                     if ret == 0:
                         return 0
                     if ret < -1:
                         changedheads += ret + 1
                     elif ret > 1:
                         changedheads += ret - 1
                 if changedheads > 0:
                     return 1 + changedheads
                 if changedheads < 0:
                     return -1 + changedheads
                 return 1
             # Maps a bundle type name to a (header, compression) pair. writebundle()
             # emits the header string first and uses the compression value as the
             # key into util.compressors for the rest of the stream.
             bundletypes = {
                 "": ("", None),       # only when using unbundle on ssh and old http servers
                                       # since the unification ssh accepts a header but there
                                       # is no capability signaling it.
                 # no pair for HG20: writebundle() handles it through bundle2 and
                 # never looks this entry up
                 "HG20": (), # special-cased below
                 "HG10UN": ("HG10UN", None),
                 # NOTE(review): header is only "HG10" here; presumably the bz2
                 # stream itself supplies the trailing "BZ" - confirm
                 "HG10BZ": ("HG10", 'BZ'),
                 "HG10GZ": ("HG10GZ", 'GZ'),
             }
             # hgweb uses this list to communicate its preferred type
             # (every entry is a key of bundletypes)
             bundlepriority = ['HG10GZ', 'HG10BZ', 'HG10UN']
             def writechunks(ui, chunks, filename, vfs=None):
                 """Write every item of chunks to a file and return the file's name.

                 With a filename, the file is opened in "wb" mode through vfs when one
                 is given, otherwise with the builtin open(). Without a filename, a
                 temporary "hg-bundle-*.hg" file is created and its path returned.
                 If writing fails part-way, the file is removed again before the
                 exception propagates. ui is accepted but not used here.
                 """
                 fh = None
                 cleanup = None
                 try:
                     if not filename:
                         fd, filename = tempfile.mkstemp(prefix="hg-bundle-",
                                                         suffix=".hg")
                         fh = os.fdopen(fd, "wb")
                     elif vfs:
                         fh = vfs.open(filename, "wb")
                     else:
                         fh = open(filename, "wb")
                     # from here on a failure must not leave a partial file behind
                     cleanup = filename
                     for piece in chunks:
                         fh.write(piece)
                     # everything was written: keep the file
                     cleanup = None
                     return filename
                 finally:
                     if fh is not None:
                         fh.close()
                     if cleanup is not None:
                         remove = vfs.unlink if (filename and vfs) else os.unlink
                         remove(cleanup)
             def writebundle(ui, cg, filename, bundletype, vfs=None, compression=None):
                 """Serialize changegroup cg as a bundle file and return its filename.

                 bundletype "HG20" wraps the changegroup in a bundle2 container, with
                 compression passed to the bundle. Any other type is looked up in
                 bundletypes: it must carry a version '01' changegroup, compression
                 must be None, and the output is the type's header followed by the
                 compressed chunks. Writing is delegated to writechunks(), so a
                 missing filename yields a temporary file and a failed write removes
                 the file.
                 """
                 if bundletype != "HG20":
                     # compression argument is only for the bundle2 case
                     assert compression is None
                     if cg.version != '01':
                         raise error.Abort(_('old bundle types only supports v1 '
                                             'changegroups'))
                     header, comp = bundletypes[bundletype]
                     if comp not in util.compressors:
                         raise error.Abort(_('unknown stream compression type: %s')
                                           % comp)
                     compressor = util.compressors[comp]()
                     rawchunks = cg.getchunks()
                     def compressedchunks():
                         # header first, then each chunk through the compressor,
                         # then whatever the compressor still buffers
                         yield header
                         for chunk in rawchunks:
                             yield compressor.compress(chunk)
                         yield compressor.flush()
                     chunkiter = compressedchunks()
                 else:
                     from . import bundle2
                     bundle = bundle2.bundle20(ui)
                     bundle.setcompression(compression)
                     part = bundle.newpart('changegroup', data=cg.getchunks())
                     part.addparam('version', cg.version)
                     chunkiter = bundle.getchunks()
                 # parse the changegroup data, otherwise we will block
                 # in case of sshrepo because we don't know the end of the stream
                 # an empty chunkgroup is the end of the changegroup
                 # a changegroup has at least 2 chunkgroups (changelog and manifest).
                 # after that, an empty chunkgroup is the end of the changegroup
                 return writechunks(ui, chunkiter, filename, vfs=vfs)
             class cg1unpacker(object):
                 """Unpacker for cg1 changegroup streams.
                 A changegroup unpacker handles the framing of the revision data in
                 the wire format. Most consumers will want to use the apply()
                 method to add the changes from the changegroup to a repository.
                 If you're forwarding a changegroup unmodified to another consumer,
                 use getchunks(), which returns an iterator of changegroup
                 chunks. This is mostly useful for cases where you need to know the
                 data stream has ended by observing the end of the changegroup.
                 deltachunk() is useful only if you're applying delta data. Most
                 consumers should prefer apply() instead.
                 A few other public methods exist. Those are used only for
                 bundlerepo and some debug commands - their use is discouraged.
                 """
                 deltaheader = _CHANGEGROUPV1_DELTA_HEADER
                 deltaheadersize = struct.calcsize(deltaheader)
                 version = '01'
                 _grouplistcount = 1 # One list of files after the manifests
                 def __init__(self, fh, alg):
                     """wrap fh in the decompressor registered for alg

                     alg is a key of util.decompressors; 'UN' is accepted as an alias
                     for None and 'BZ' is mapped to '_truncatedBZ'. An unknown value
                     raises error.Abort.
                     """
                     if alg == 'UN':
                         # get more modern without breaking too much
                         alg = None
                     if alg not in util.decompressors:
                         raise error.Abort(_('unknown stream compression type: %s')
                                          % alg)
                     if alg == 'BZ':
                         alg = '_truncatedBZ'
                     decompress = util.decompressors[alg]
                     self._stream = decompress(fh)
                     self._type = alg
                     # invoked by _chunklength() for every non-empty chunk when set
                     self.callback = None
                 # These methods (compressed, read, seek, tell) all appear to only
                 # be used by bundlerepo, but it's a little hard to tell.
                 def compressed(self):
                     """tell whether a compression type was recorded at construction"""
                     if self._type is None:
                         return False
                     return True
                 def read(self, l):
                     """read l bytes from the wrapped (decompressing) stream"""
                     stream = self._stream
                     return stream.read(l)
                 def seek(self, pos):
                     """forward seek(pos) to the wrapped stream and return its result"""
                     stream = self._stream
                     return stream.seek(pos)
                 def tell(self):
                     """report the wrapped stream's current position"""
                     stream = self._stream
                     return stream.tell()
                 def close(self):
                     """close the wrapped stream, passing along whatever it returns"""
                     stream = self._stream
                     return stream.close()
                 def _chunklength(self):
                     """read a chunk length prefix and return the payload size

                     Returns 0 for an empty chunk. For a non-empty chunk the progress
                     callback, if set, is invoked once before the size is returned.
                     Lengths of 1..4 or below zero raise error.Abort.
                     """
                     prefix = readexactly(self._stream, 4)
                     (length,) = struct.unpack(">l", prefix)
                     if length > 4:
                         if self.callback:
                             self.callback()
                         # the encoded length counts its own 4 bytes
                         return length - 4
                     if length:
                         raise error.Abort(_("invalid chunk length %d") % length)
                     return 0
                 def changelogheader(self):
                     """return an empty dict: v10 carries no changelog header chunk"""
                     header = {}
                     return header
                 def manifestheader(self):
                     """return an empty dict: v10 carries no manifest header chunk"""
                     header = {}
                     return header
                 def filelogheader(self):
                     """read the header chunk that introduces a filelog group

                     In v10 the chunk payload is just the filename. Returns
                     {'filename': name}, or {} when the chunk is empty.
                     """
                     size = self._chunklength()
                     if size:
                         return {'filename': readexactly(self._stream, size)}
                     return {}
                 def _deltaheader(self, headertuple, prevnode):
                     """expand an unpacked v1 header into the common six-field form

                     headertuple is (node, p1, p2, cs). The delta base is not part of
                     the v1 header: it is prevnode, or p1 when prevnode is None. Flags
                     are always 0. Returns (node, p1, p2, deltabase, cs, flags).
                     """
                     node, p1, p2, cs = headertuple
                     deltabase = p1 if prevnode is None else prevnode
                     return node, p1, p2, deltabase, cs, 0
                 def deltachunk(self, prevnode):
                     """read one delta chunk and return it as a dict

                     Returns {} for an empty chunk. Otherwise the chunk is split into
                     its fixed-size header (decoded with self.deltaheader and
                     normalized by _deltaheader()) and the delta payload that follows.
                     """
                     size = self._chunklength()
                     if not size:
                         return {}
                     rawheader = readexactly(self._stream, self.deltaheadersize)
                     fields = struct.unpack(self.deltaheader, rawheader)
                     # whatever follows the header inside the chunk is the delta
                     payload = readexactly(self._stream, size - self.deltaheadersize)
                     node, p1, p2, deltabase, cs, flags = self._deltaheader(fields,
                                                                          prevnode)
                     return {
                         'node': node,
                         'p1': p1,
                         'p2': p2,
                         'cs': cs,
                         'deltabase': deltabase,
                         'delta': payload,
                         'flags': flags,
                     }
                 def getchunks(self):
                     """generate the raw framed chunks that make up this changegroup

                     Meant for forwarding the binary stream to a file or another
                     network API. The data is parsed only as far as needed to find the
                     end of the changegroup, since the underlying stream (sshrepo, for
                     instance) gives no other end marker and reading on would block.
                     """
                     # an empty chunkgroup is the end of the changegroup
                     # a changegroup has at least 2 chunkgroups (changelog and manifest).
                     # after that, changegroup versions 1 and 2 have a series of groups
                     # with one group per file. changegroup 3 has a series of directory
                     # manifests before the files.
                     piece = 2 ** 20
                     groupindex = 0
                     emptygroups = 0
                     while emptygroups < self._grouplistcount:
                         groupindex += 1
                         sawchunk = False
                         chunk = getchunk(self)
                         while chunk:
                             sawchunk = True
                             yield chunkheader(len(chunk))
                             # hand the payload out in slices of at most 1 MiB
                             for start in range(0, len(chunk), piece):
                                 yield chunk[start:start + piece]
                             chunk = getchunk(self)
                         # only groups after the first two can terminate a group list
                         if groupindex > 2 and not sawchunk:
                             emptygroups += 1
                         yield closechunk()
                 def _unpackmanifests(self, repo, revmap, trp, prog, numchanges):
                     """add the manifest group of this changegroup to repo.manifest

                     prog is called with the 'manifests' topic and numchanges, and its
                     result becomes the per-chunk callback while the group is read.
                     The 'manifests' progress topic is closed afterwards.
                     """
                     # We know that we'll never have more manifests than we had
                     # changesets.
                     progress = prog(_('manifests'), numchanges)
                     self.callback = progress
                     # no need to check for empty manifest group here:
                     # if the result of the merge of 1 and 2 is the same in 3 and 4,
                     # no new manifest will be created and the manifest group will
                     # be empty during the pull
                     self.manifestheader()
                     manifest = repo.manifest
                     manifest.addgroup(self, revmap, trp)
                     ui = repo.ui
                     ui.progress(_('manifests'), None)
                 def apply(self, repo, srctype, url, emptyok=False,
                           targetphase=phases.draft, expectedtotal=None):
                     """Add the changegroup returned by source.read() to this repo.

                     srctype is a string like 'push', 'pull', or 'unbundle'.  url is
                     the URL of the repo where this changegroup is coming from.

                     emptyok allows an empty changelog group (otherwise error.Abort is
                     raised).  targetphase is the phase boundary applied to the added
                     changesets unless srctype is 'push', 'serve' or 'strip'.
                     expectedtotal is passed as the total for changeset progress.

                     Return an integer summarizing the change to this repo:
                     - nothing changed or no source: 0
                     - more heads than before: 1+added heads (2..n)
                     - fewer heads than before: -1-removed heads (-2..-n)
                     - number of heads stays the same: 1

                     NOTE(review): the body visible here never returns 0 (see the final
                     return statements); the 0 case above may only apply to callers.
                     """
                     repo = repo.unfiltered()
                     # csmap/revmap close over ``cl``, which is bound inside the
                     # transaction below before either callback is invoked.
                     def csmap(x):
                         repo.ui.debug("add changeset %s\n" % short(x))
                         return len(cl)
                     def revmap(x):
                         return cl.rev(x)
                     changesets = files = revisions = 0
                     try:
                         with repo.transaction("\n".join([srctype,
                                                          util.hidepassword(url)])) as tr:
                             # The transaction could have been created before and already
                             # carries source information. In this case we use the top
                             # level data. We overwrite the argument because we need to use
                             # the top level value (if they exist) in this function.
                             srctype = tr.hookargs.setdefault('source', srctype)
                             url = tr.hookargs.setdefault('url', url)
                             repo.hook('prechangegroup', throw=True, **tr.hookargs)
                             # write changelog data to temp files so concurrent readers
                             # will not see an inconsistent view
                             cl = repo.changelog
                             cl.delayupdate(tr)
                             oldheads = cl.heads()
                             # weak proxy so the revlogs do not hold a strong reference
                             # to the transaction
                             trp = weakref.proxy(tr)
                             # pull off the changeset group
                             repo.ui.status(_("adding changesets\n"))
                             clstart = len(cl)
                             # Progress callback: each call reports one more chunk for
                             # the given step.
                             class prog(object):
                                 def __init__(self, step, total):
                                     self._step = step
                                     self._total = total
                                     self._count = 1
                                 def __call__(self):
                                     repo.ui.progress(self._step, self._count,
                                                      unit=_('chunks'), total=self._total)
                                     self._count += 1
                             self.callback = prog(_('changesets'), expectedtotal)
                             # Collect the files touched by the incoming changesets; only
                             # their count is used later, as the files progress total.
                             efiles = set()
                             def onchangelog(cl, node):
                                 efiles.update(cl.read(node)[3])
                             self.changelogheader()
                             srccontent = cl.addgroup(self, csmap, trp,
                                                      addrevisioncb=onchangelog)
                             efiles = len(efiles)
                             if not (srccontent or emptyok):
                                 raise error.Abort(_("received changelog group is empty"))
                             clend = len(cl)
                             changesets = clend - clstart
                             repo.ui.progress(_('changesets'), None)
                             # pull off the manifest group
                             repo.ui.status(_("adding manifests\n"))
                             self._unpackmanifests(repo, revmap, trp, prog, changesets)
                             # file name -> set of file nodes that must be received;
                             # only filled in when server.validate is enabled
                             needfiles = {}
                             if repo.ui.configbool('server', 'validate', default=False):
                                 # validate incoming csets have their manifests
                                 for cset in xrange(clstart, clend):
                                     mfnode = repo.changelog.read(
                                         repo.changelog.node(cset))[0]
                                     mfest = repo.manifest.readdelta(mfnode)
                                     # store file nodes we must see
                                     for f, n in mfest.iteritems():
                                         needfiles.setdefault(f, set()).add(n)
                             # process the files
                             repo.ui.status(_("adding file changes\n"))
                             self.callback = None
                             pr = prog(_('files'), efiles)
                             newrevs, newfiles = _addchangegroupfiles(
                                 repo, self, revmap, trp, pr, needfiles)
                             revisions += newrevs
                             files += newfiles
                             # dh is the change in head count; new heads that close a
                             # branch are not counted.
                             dh = 0
                             if oldheads:
                                 heads = cl.heads()
                                 dh = len(heads) - len(oldheads)
                                 for h in heads:
                                     if h not in oldheads and repo[h].closesbranch():
                                         dh -= 1
                             htext = ""
                             if dh:
                                 htext = _(" (%+d heads)") % dh
                             repo.ui.status(_("added %d changesets"
                                              " with %d changes to %d files%s\n")
                                              % (changesets, revisions, files, htext))
                             repo.invalidatevolatilesets()
                             if changesets > 0:
                                 # Record the first/last added node on the transaction
                                 # only if no 'node' is recorded there yet; otherwise
                                 # only the local copy handed to the hooks is updated.
                                 if 'node' not in tr.hookargs:
                                     tr.hookargs['node'] = hex(cl.node(clstart))
                                     tr.hookargs['node_last'] = hex(cl.node(clend - 1))
                                     hookargs = dict(tr.hookargs)
                                 else:
                                     hookargs = dict(tr.hookargs)
                                     hookargs['node'] = hex(cl.node(clstart))
                                     hookargs['node_last'] = hex(cl.node(clend - 1))
                                 repo.hook('pretxnchangegroup', throw=True, **hookargs)
                             added = [cl.node(r) for r in xrange(clstart, clend)]
                             publishing = repo.publishing()
                             if srctype in ('push', 'serve'):
                                 # Old servers can not push the boundary themselves.
                                 # New servers won't push the boundary if changeset already
                                 # exists locally as secret
                                 #
                                 # We should not use added here but the list of all changes
                                 # in the bundle
                                 if publishing:
                                     phases.advanceboundary(repo, tr, phases.public,
                                                            srccontent)
                                 else:
                                     # Those changesets have been pushed from the
                                     # outside, their phases are going to be pushed
                                     # alongside. Therefore `targetphase` is
                                     # ignored.
                                     phases.advanceboundary(repo, tr, phases.draft,
                                                            srccontent)
                                     phases.retractboundary(repo, tr, phases.draft, added)
                             elif srctype != 'strip':
                                 # publishing only alter behavior during push
                                 #
                                 # strip should not touch boundary at all
                                 phases.retractboundary(repo, tr, targetphase, added)
                             if changesets > 0:
                                 if srctype != 'strip':
                                     # During strip, branchcache is invalid but
                                     # coming call to `destroyed` will repair it.
                                     # In other case we can safely update cache on
                                     # disk.
                                     branchmap.updatecache(repo.filtered('served'))
                                 def runhooks():
                                     # These hooks run when the lock releases, not when the
                                     # transaction closes. So it's possible for the changelog
                                     # to have changed since we last saw it.
                                     if clstart >= len(repo):
                                         return
                                     # forcefully update the on-disk branch cache
                                     # NOTE(review): only a debug message is emitted here;
                                     # no cache update call is visible in this closure.
                                     repo.ui.debug("updating the branch cache\n")
                                     repo.hook("changegroup", **hookargs)
                                     # 'incoming' fires once per added node, without
                                     # 'node_last'.
                                     for n in added:
                                         args = hookargs.copy()
                                         args['node'] = hex(n)
                                         del args['node_last']
                                         repo.hook("incoming", **args)
                                     newheads = [h for h in repo.heads()
                                                 if h not in oldheads]
                                     repo.ui.log("incoming",
                                                 "%s incoming changes - new heads: %s\n",
                                                 len(added),
                                                 ', '.join([hex(c[:6]) for c in newheads]))
                                 # Defer the hooks: after the transaction closes they are
                                 # queued through repo._afterlock.
                                 tr.addpostclose('changegroup-runhooks-%020i' % clstart,
                                                 lambda tr: repo._afterlock(runhooks))
                     finally:
                         repo.ui.flush()
                     # never return 0 here:
                     if dh < 0:
                         return dh - 1
                     else:
                         return dh + 1
             class cg2unpacker(cg1unpacker):
                 """Unpacker for cg2 streams.

                 cg2 adds generaldelta support, which makes the delta header carry
                 one more field than cg1; everything else about the data is
                 unchanged.
                 """
                 version = '02'
                 deltaheader = _CHANGEGROUPV2_DELTA_HEADER
                 deltaheadersize = struct.calcsize(deltaheader)

                 def _deltaheader(self, headertuple, prevnode):
                     """Expand a five-field cg2 header into the six-field form.

                     prevnode is not used; the delta base comes from the header.
                     """
                     (node, p1, p2, deltabase, cs) = headertuple
                     # the cg2 header has no flags field, so flags are reported as 0
                     return (node, p1, p2, deltabase, cs, 0)
             class cg3unpacker(cg2unpacker):
                 """Unpacker for cg3 streams.

                 cg3 adds exchange of treemanifests and revlog flags: the delta
                 header gains a flags field, and an empty chunk separates the
                 manifests from the files.
                 """
                 version = '03'
                 deltaheader = _CHANGEGROUPV3_DELTA_HEADER
                 deltaheadersize = struct.calcsize(deltaheader)
                 _grouplistcount = 2 # One list of manifests and one list of files

                 def _deltaheader(self, headertuple, prevnode):
                     """Return the six header fields as read; prevnode is unused."""
                     (node, p1, p2, deltabase, cs, flags) = headertuple
                     return (node, p1, p2, deltabase, cs, flags)

                 def _unpackmanifests(self, repo, revmap, trp, prog, numchanges):
                     """Unpack the root manifests, then any directory manifest groups.

                     Raises error.Abort when a directory group adds nothing.
                     """
                     super(cg3unpacker, self)._unpackmanifests(repo, revmap, trp, prog,
                                                               numchanges)
                     # Each non-empty header announces one directory manifest group;
                     # an empty header ends the list.
                     header = self.filelogheader()
                     while header:
                         dirname = header["filename"]
                         repo.ui.debug("adding %s revisions\n" % dirname)
                         added = repo.manifest.dirlog(dirname).addgroup(self, revmap,
                                                                        trp)
                         if not added:
                             raise error.Abort(_("received dir revlog group is empty"))
                         header = self.filelogheader()
             class headerlessfixup(object):
                 """File-like reader that serves the bytes in ``h`` before ``fh``."""

                 def __init__(self, fh, h):
                     self._fh = fh
                     self._h = h

                 def read(self, n):
                     """Return n bytes, draining the pending header bytes first."""
                     pending = self._h
                     if not pending:
                         # header exhausted: read straight from the file handle
                         return readexactly(self._fh, n)
                     data = pending[:n]
                     self._h = pending[n:]
                     shortfall = n - len(data)
                     if shortfall > 0:
                         # header ran out mid-read; top up from the file handle
                         data += readexactly(self._fh, shortfall)
                     return data
             def _moddirs(files):
                 """Given a set of modified files, find the list of modified directories.

                 This returns a list of (path to changed dir, changed dir) tuples,
                 as that's what the one client needs anyway.

                 >>> _moddirs(['a/b/c.py', 'a/b/c.txt', 'a/d/e/f/g.txt', 'i.txt', ])
                 [('/', 'a/'), ('a/', 'b/'), ('a/', 'd/'), ('a/d/', 'e/'), ('a/d/e/', 'f/')]
                 """
                 seen = set()
                 for fname in files:
                     # directory components only; the file name itself is dropped
                     parts = fname.split('/')[:-1]
                     # Walk from the deepest directory upwards and stop at the first
                     # pair already recorded: its ancestors were recorded with it.
                     for depth in xrange(len(parts), 0, -1):
                         parent = '/'.join(parts[:depth - 1]) + '/'
                         pair = (parent, parts[depth - 1] + '/')
                         if pair in seen:
                             break
                         seen.add(pair)
                 return sorted(seen)
             class cg1packer(object):
                 deltaheader = _CHANGEGROUPV1_DELTA_HEADER
                 version = '01'
                 def __init__(self, repo, bundlecaps=None):
                     """Given a source repo, construct a bundler.

                     bundlecaps is optional and can be used to specify the set of
                     capabilities which can be used to build the bundle.
                     """
                     ui = repo.ui
                     self._repo = repo
                     # Set of capabilities we can use to build the bundle.
                     self._bundlecaps = set() if bundlecaps is None else bundlecaps
                     # experimental config: bundle.reorder
                     setting = ui.config('bundle', 'reorder', 'auto')
                     # 'auto' is kept as None; any other value is parsed as a boolean
                     if setting == 'auto':
                         self._reorder = None
                     else:
                         self._reorder = util.parsebool(setting)
                     self._progress = ui.progress
                     # per-section size notes are shown in verbose, non-debug mode only
                     if ui.verbose and not ui.debugflag:
                         self._verbosenote = ui.note
                     else:
                         self._verbosenote = lambda s: None
                 def close(self):
                     """Return the closing chunk that group() and generate() yield last."""
                     terminator = closechunk()
                     return terminator
                 def fileheader(self, fname):
                     """Return a chunk header for len(fname) followed by fname itself."""
                     header = chunkheader(len(fname))
                     return header + fname
                 def group(self, nodelist, revlog, lookup, units=None):
                     """Calculate a delta group, yielding a sequence of changegroup chunks
                     (strings).

                     Given a list of changeset revs, return a set of deltas and
                     metadata corresponding to nodes. The first delta is
                     first parent(nodelist[0]) -> nodelist[0], the receiver is
                     guaranteed to have this parent as it has all history before
                     these changesets. In the case firstparent is nullrev the
                     changegroup starts with a full revision.

                     If units is not None, progress detail will be generated, units
                     specifies the type of revlog that is touched (changelog, manifest,
                     etc.).
                     """
                     # nothing touched by these changesets: emit only the closing chunk
                     if len(nodelist) == 0:
                         yield self.close()
                         return

                     # for generaldelta revlogs, we linearize the revs; this will both be
                     # much quicker and generate a much smaller bundle
                     if (revlog._generaldelta and self._reorder is None) or self._reorder:
                         dag = dagutil.revlogdag(revlog)
                         revs = dag.linearize(set(revlog.rev(n) for n in nodelist))
                     else:
                         revs = sorted([revlog.rev(n) for n in nodelist])

                     # the first delta is taken against the first parent of the first rev
                     prev = revlog.parentrevs(revs[0])[0]

                     # build deltas, each one against the revision sent just before it
                     total = len(revs)
                     msgbundling = _('bundling')
                     for done, curr in enumerate(revs, 1):
                         if units is not None:
                             self._progress(msgbundling, done, unit=units, total=total)
                         linknode = lookup(revlog.node(curr))
                         for c in self.revchunk(revlog, curr, prev, linknode):
                             yield c
                         prev = curr

                     if units is not None:
                         self._progress(msgbundling, None)
                     yield self.close()
                 # filter any nodes that claim to be part of the known set
                 def prune(self, revlog, missing, commonrevs):
                     """Return the nodes of missing whose linkrev is not in commonrevs."""
                     torev = revlog.rev
                     tolinkrev = revlog.linkrev
                     kept = []
                     for node in missing:
                         if tolinkrev(torev(node)) in commonrevs:
                             # linked to a common changeset: drop the node
                             continue
                         kept.append(node)
                     return kept
                 def _packmanifests(self, dir, mfnodes, lookuplinknode):
                     """Pack flat manifests into a changegroup stream.

                     Only the root manifest is supported here, so dir must be empty.
                     """
                     assert not dir
                     manifestlog = self._repo.manifest
                     chunks = self.group(mfnodes, manifestlog, lookuplinknode,
                                         units=_('manifests'))
                     for chunk in chunks:
                         yield chunk
                 def _manifestsdone(self):
                     """Return what is emitted after the manifests: an empty string here."""
                     nothing = ''
                     return nothing
                 def generate(self, commonrevs, clnodes, fastpathlinkrev, source):
                     '''yield a sequence of changegroup chunks (strings)

                     Chunks are produced in this order: the changelog group for
                     clnodes, the manifest groups, the file groups, then a final
                     closing chunk. After that the 'outgoing' hook is run if clnodes
                     is not empty.

                     commonrevs is handed to the manifest and file generators for
                     pruning. fastpathlinkrev requests the fast linkrev lookup; it is
                     switched off below when reordering is on or the repo requires
                     treemanifest. source is passed to generatefiles and to the hook.
                     '''
                     repo = self._repo
                     cl = repo.changelog
                     # changelog node -> position in which it was emitted
                     clrevorder = {}
                     mfs = {} # needed manifests
                     fnodes = {} # needed file nodes
                     # maps manifest node id -> set(changed files)
                     mfchangedfiles = {}
                     # Callback for the changelog, used to collect changed files and manifest
                     # nodes.
                     # Returns the linkrev node (identity in the changelog case).
                     def lookupcl(x):
                         c = cl.read(x)
                         clrevorder[x] = len(clrevorder)
                         n = c[0]
                         # record the first changeset introducing this manifest version
                         mfs.setdefault(n, x)
                         # Record a complete list of potentially-changed files in
                         # this manifest.
                         mfchangedfiles.setdefault(n, set()).update(c[3])
                         return x
                     self._verbosenote(_('uncompressed size of bundle content:\n'))
                     size = 0
                     # lookupcl fills mfs, mfchangedfiles and clrevorder as a side
                     # effect while the changelog group is being consumed
                     for chunk in self.group(clnodes, cl, lookupcl, units=_('changesets')):
                         size += len(chunk)
                         yield chunk
                     self._verbosenote(_('%8.i (changelog)\n') % size)
                     # We need to make sure that the linkrev in the changegroup refers to
                     # the first changeset that introduced the manifest or file revision.
                     # The fastpath is usually safer than the slowpath, because the filelogs
                     # are walked in revlog order.
                     #
                     # When taking the slowpath with reorder=None and the manifest revlog
                     # uses generaldelta, the manifest may be walked in the "wrong" order.
                     # Without 'clrevorder', we would get an incorrect linkrev (see fix in
                     # cc0ff93d0c0c).
                     #
                     # When taking the fastpath, we are only vulnerable to reordering
                     # of the changelog itself. The changelog never uses generaldelta, so
                     # it is only reordered when reorder=True. To handle this case, we
                     # simply take the slowpath, which already has the 'clrevorder' logic.
                     # This was also fixed in cc0ff93d0c0c.
                     fastpathlinkrev = fastpathlinkrev and not self._reorder
                     # Treemanifests don't work correctly with fastpathlinkrev
                     # either, because we don't discover which directory nodes to
                     # send along with files. This could probably be fixed.
                     fastpathlinkrev = fastpathlinkrev and (
                         'treemanifest' not in repo.requirements)
                     for chunk in self.generatemanifests(commonrevs, clrevorder,
                             fastpathlinkrev, mfs, mfchangedfiles, fnodes):
                         yield chunk
                     # the manifest -> changeset mapping is not needed past this point
                     mfs.clear()
                     clrevs = set(cl.rev(x) for x in clnodes)
                     # linknodes(filerevlog, fname) returns {file node: changelog node}
                     if not fastpathlinkrev:
                         # slowpath: use what the manifest lookup collected in fnodes
                         def linknodes(unused, fname):
                             return fnodes.get(fname, {})
                     else:
                         cln = cl.node
                         # fastpath: scan the filelog and keep the revisions whose
                         # linkrev is one of the outgoing changesets
                         def linknodes(filerevlog, fname):
                             llr = filerevlog.linkrev
                             fln = filerevlog.node
                             revs = ((r, llr(r)) for r in filerevlog)
                             return dict((fln(r), cln(lr)) for r, lr in revs if lr in clrevs)
                     # union of the changed files recorded for every manifest
                     changedfiles = set()
                     for x in mfchangedfiles.itervalues():
                         changedfiles.update(x)
                     for chunk in self.generatefiles(changedfiles, linknodes, commonrevs,
                                                     source):
                         yield chunk
                     yield self.close()
                     # runs only once the consumer has drained the generator this far
                     if clnodes:
                         repo.hook('outgoing', node=hex(clnodes[0]), source=source)
                 def generatemanifests(self, commonrevs, clrevorder, fastpathlinkrev, mfs,
                                       mfchangedfiles, fnodes):
                     """Yield the manifest chunks of the changegroup.

                     The root manifest group is sent first, then one group per
                     directory manifest discovered while the root group was being
                     generated, and finally whatever _manifestsdone() returns.

                     commonrevs is passed to prune() to drop nodes the receiver has.
                     clrevorder maps changelog nodes to a sortable position; the lowest
                     position wins when choosing a linknode.
                     fastpathlinkrev, when true, skips file node collection.
                     mfs maps manifest node -> changelog node.
                     mfchangedfiles maps manifest node -> changed file names.
                     fnodes is filled in here: file name -> {file node: changelog node}.
                     """
                     repo = self._repo
                     ml = repo.manifest
                     # directory -> {manifest node: linknode}; the root directory ('')
                     # starts with the manifests collected from the changelog, and
                     # sub-directories are added by lookupmflinknode below
                     tmfnodes = {'': mfs}

                     # Callback for the manifest, used to collect linkrevs for filelog
                     # revisions.
                     # Returns the linkrev node (collected in lookupcl).
                     def makelookupmflinknode(dir):
                         if fastpathlinkrev:
                             assert not dir
                             return mfs.__getitem__

                         if dir:
                             return tmfnodes[dir].get

                         def lookupmflinknode(x):
                             """Callback for looking up the linknode for manifests.

                             Returns the linkrev node for the specified manifest.

                             SIDE EFFECT:

                             1) fclnodes gets populated with the list of relevant
                                file nodes if we're not using fastpathlinkrev
                             2) When treemanifests are in use, collects treemanifest nodes
                                to send

                             Note that this means manifests must be completely sent to
                             the client before you can trust the list of files and
                             treemanifests to send.
                             """
                             clnode = mfs[x]
                             # We no longer actually care about reading deltas of
                             # the manifest here, because we already know the list
                             # of changed files, so for treemanifests (which
                             # lazily-load anyway to *generate* a readdelta) we can
                             # just load them with read() and then we'll actually
                             # be able to correctly load node IDs from the
                             # submanifest entries.
                             if 'treemanifest' in repo.requirements:
                                 mdata = ml.read(x)
                             else:
                                 mdata = ml.readfast(x)
                             for f in mfchangedfiles[x]:
                                 try:
                                     n = mdata[f]
                                 except KeyError:
                                     continue
                                 # record the first changeset introducing this filelog
                                 # version
                                 fclnodes = fnodes.setdefault(f, {})
                                 fclnode = fclnodes.setdefault(n, clnode)
                                 if clrevorder[clnode] < clrevorder[fclnode]:
                                     fclnodes[n] = clnode
                             # gather list of changed treemanifest nodes
                             if 'treemanifest' in repo.requirements:
                                 submfs = {'/': mdata}
                                 for dn, bn in _moddirs(mfchangedfiles[x]):
                                     try:
                                         submf = submfs[dn]
                                         submf = submf._dirs[bn]
                                     except KeyError:
                                         continue # deleted directory, so nothing to send
                                     submfs[submf.dir()] = submf
                                     tmfclnodes = tmfnodes.setdefault(submf.dir(), {})
                                     tmfclnode = tmfclnodes.setdefault(submf._node, clnode)
                                     if clrevorder[clnode] < clrevorder[tmfclnode]:
                                         # key on the directory manifest node itself,
                                         # not on the file node left over from the
                                         # loop above
                                         tmfclnodes[submf._node] = clnode
                             return clnode
                         return lookupmflinknode

                     size = 0
                     # tmfnodes grows while the root group is generated, so drain it
                     # one directory at a time instead of iterating over it; '' sorts
                     # first, which sends the root manifests before any directory
                     while tmfnodes:
                         dir = min(tmfnodes)
                         nodes = tmfnodes[dir]
                         prunednodes = self.prune(ml.dirlog(dir), nodes, commonrevs)
                         for x in self._packmanifests(dir, prunednodes,
                                                      makelookupmflinknode(dir)):
                             size += len(x)
                             yield x
                         del tmfnodes[dir]
                     self._verbosenote(_('%8.i (manifests)\n') % size)
                     yield self._manifestsdone()
                 # The 'source' parameter is useful for extensions
                 def generatefiles(self, changedfiles, linknodes, commonrevs, source):
                     """Yield the file groups: per file, a header then its delta group.

                     linknodes(filerevlog, fname) supplies a {file node: linknode}
                     mapping for each file; files left with no nodes after pruning
                     against commonrevs are skipped. Raises error.Abort when the
                     revlog of a changed file is empty or missing. source is not used
                     here; it exists for extensions.
                     """
                     repo = self._repo
                     progress = self._progress
                     total = len(changedfiles)
                     msgbundling = _('bundling')
                     # for progress output
                     msgfiles = _('files')
                     for position, fname in enumerate(sorted(changedfiles), 1):
                         filerevlog = repo.file(fname)
                         if not filerevlog:
                             raise error.Abort(_("empty or missing revlog for %s") % fname)
                         # The linkrev nodes were collected either by the fastpath
                         # scan or by the manifest lookup in the slowpath case.
                         linkrevnodes = linknodes(filerevlog, fname)
                         filenodes = self.prune(filerevlog, linkrevnodes, commonrevs)
                         if not filenodes:
                             continue
                         progress(msgbundling, position, item=fname, unit=msgfiles,
                                  total=total)
                         h = self.fileheader(fname)
                         size = len(h)
                         yield h
                         # file node -> linknode lookup straight from the mapping
                         for chunk in self.group(filenodes, filerevlog,
                                                 linkrevnodes.__getitem__):
                             size += len(chunk)
                             yield chunk
                         self._verbosenote(_('%8.i  %s\n') % (size, fname))
                     progress(msgbundling, None)
                 def deltaparent(self, revlog, rev, p1, p2, prev):
                     """Return the delta base for rev: always prev in this packer."""
                     base = prev
                     return base
                 def revchunk(self, revlog, rev, prev, linknode):
                     """Yield the three pieces of one revision chunk.

                     The pieces are the chunk header, the delta header (plus a diff
                     prefix when full text is sent) and the delta or full text itself.
                     """
                     node = revlog.node(rev)
                     p1, p2 = revlog.parentrevs(rev)
                     base = self.deltaparent(revlog, rev, p1, p2, prev)

                     prefix = ''
                     censored = revlog.iscensored(base) or revlog.iscensored(rev)
                     if not censored:
                         if base == nullrev:
                             # no base: send the full text behind a trivial diff header
                             delta = revlog.revision(node)
                             prefix = mdiff.trivialdiffheader(len(delta))
                         else:
                             delta = revlog.revdiff(base, rev)
                     else:
                         # a censored base or revision: send full content (or the
                         # tombstone) as a whole-text replacement instead of a diff
                         try:
                             delta = revlog.revision(node)
                         except error.CensoredNodeError as e:
                             delta = e.tombstone
                         if base == nullrev:
                             prefix = mdiff.trivialdiffheader(len(delta))
                         else:
                             prefix = mdiff.replacediffheader(revlog.rawsize(base),
                                                              len(delta))

                     p1n, p2n = revlog.parents(node)
                     basenode = revlog.node(base)
                     flags = revlog.flags(rev)
                     header = self.builddeltaheader(node, p1n, p2n, basenode, linknode,
                                                    flags)
                     header += prefix
                     yield chunkheader(len(header) + len(delta))
                     yield header
                     yield delta
                 def builddeltaheader(self, node, p1n, p2n, basenode, linknode, flags):
                     """Pack node, both parents and linknode using self.deltaheader."""
                     # basenode is left out: it is implicitly the previous one in HG10
                     # flags is left out: it is implicitly 0 for cg1 and cg2
                     fmt = self.deltaheader
                     return struct.pack(fmt, node, p1n, p2n, linknode)
             class cg2packer(cg1packer):
                 """Changegroup packer for version '02'.

                 The delta header written by this packer carries the delta base
                 node explicitly, and the delta base may be a revision other than
                 the previously sent one.
                 """
                 version = '02'
                 deltaheader = _CHANGEGROUPV2_DELTA_HEADER
                 def __init__(self, repo, bundlecaps=None):
                     super(cg2packer, self).__init__(repo, bundlecaps)
                     # Since generaldelta is directly supported by cg2, reordering
                     # generally doesn't help, so an unset value (bundle.reorder=auto)
                     # is treated just like bundle.reorder=False.
                     if self._reorder is None:
                         self._reorder = False
                 def deltaparent(self, revlog, rev, p1, p2, prev):
                     """Pick the revision the delta for ``rev`` is computed against."""
                     storedbase = revlog.deltaparent(rev)
                     # Keep the stored delta base only when it is a real revision
                     # (so no full revision gets stored) and we can be sure the
                     # remote has it; in every other case pick prev.
                     if storedbase != nullrev and storedbase in (p1, p2, prev):
                         return storedbase
                     return prev
                 def builddeltaheader(self, node, p1n, p2n, basenode, linknode, flags):
                     """Pack the delta header, including the explicit base node."""
                     # flags is left out: it is implicitly 0 in cg1 and cg2
                     fields = (node, p1n, p2n, basenode, linknode)
                     return struct.pack(self.deltaheader, *fields)
             class cg3packer(cg2packer):
                 """Changegroup packer for version '03'.

                 On top of the version '02' behaviour, the delta header also carries
                 the revlog flags, and manifests are packed per directory.
                 """
                 version = '03'
                 deltaheader = _CHANGEGROUPV3_DELTA_HEADER
                 def _packmanifests(self, dir, mfnodes, lookuplinknode):
                     """Yield the chunks for the manifest nodes of directory ``dir``."""
                     # a non-empty dir gets its own file header ahead of its chunks
                     if dir:
                         yield self.fileheader(dir)
                     dirlog = self._repo.manifest.dirlog(dir)
                     chunks = self.group(mfnodes, dirlog, lookuplinknode,
                                         units=_('manifests'))
                     for chunk in chunks:
                         yield chunk
                 def _manifestsdone(self):
                     """Return the result of close() once manifests are finished."""
                     return self.close()
                 def builddeltaheader(self, node, p1n, p2n, basenode, linknode, flags):
                     """Pack the delta header, including base node and flags."""
                     fields = (node, p1n, p2n, basenode, linknode, flags)
                     return struct.pack(self.deltaheader, *fields)
             # Maps a changegroup version string to its (packer, unpacker) classes;
             # index 0 is used to create bundlers, index 1 to create unbundlers.
             _packermap = {'01': (cg1packer, cg1unpacker),
                          # cg2 adds support for exchanging generaldelta
                          '02': (cg2packer, cg2unpacker),
                          # cg3 adds support for exchanging revlog flags and treemanifests
                          '03': (cg3packer, cg3unpacker),
             }
             def allsupportedversions(ui):
                 """Return the set of changegroup versions enabled by ``ui``.

                 Version '03' is part of the result only when either the
                 experimental.changegroup3 or the experimental.treemanifest
                 config option is set.
                 """
                 versions = set(_packermap)
                 wantcg3 = (ui.configbool('experimental', 'changegroup3') or
                            ui.configbool('experimental', 'treemanifest'))
                 if wantcg3:
                     versions.add('03')
                 else:
                     versions.discard('03')
                 return versions
             # Changegroup versions that can be applied to the repo
             def supportedincomingversions(repo):
                 """Return the set of changegroup versions ``repo`` can apply.

                 A repo with the 'treemanifest' requirement always accepts '03'.
                 """
                 incoming = allsupportedversions(repo.ui)
                 usestreemanifest = 'treemanifest' in repo.requirements
                 if usestreemanifest:
                     incoming.add('03')
                 return incoming
             # Changegroup versions that can be created from the repo
             def supportedoutgoingversions(repo):
                 """Return the set of changegroup versions ``repo`` can produce.

                 A repo with the 'treemanifest' requirement only produces '03'
                 out of the three known versions.
                 """
                 outgoing = allsupportedversions(repo.ui)
                 if 'treemanifest' not in repo.requirements:
                     return outgoing
                 # Versions 01 and 02 support only flat manifests and it's just too
                 # expensive to convert between the flat manifest and tree manifest on
                 # the fly. Since tree manifests are hashed differently, all of history
                 # would have to be converted. Instead, we simply don't even pretend to
                 # support versions 01 and 02.
                 for flatonly in ('01', '02'):
                     outgoing.discard(flatonly)
                 outgoing.add('03')
                 return outgoing
             def safeversion(repo):
                 """Return the smallest changegroup version safe to send from ``repo``.

                 This is the lowest version that clients of the repo can be assumed
                 to support. For example, all hg versions that support generaldelta
                 also support changegroup 02, so '01' is ruled out for such repos.
                 """
                 candidates = supportedoutgoingversions(repo)
                 usesgeneraldelta = 'generaldelta' in repo.requirements
                 if usesgeneraldelta:
                     candidates.discard('01')
                 assert candidates
                 return min(candidates)
             def getbundler(version, repo, bundlecaps=None):
                 """Instantiate the packer registered for changegroup ``version``.

                 ``version`` must be one of the versions the repo can produce.
                 """
                 assert version in supportedoutgoingversions(repo)
                 packercls = _packermap[version][0]
                 return packercls(repo, bundlecaps)
             def getunbundler(version, fh, alg):
                 """Instantiate the unpacker registered for changegroup ``version``.

                 ``fh`` and ``alg`` are handed to the unpacker class unchanged.
                 """
                 unpackercls = _packermap[version][1]
                 return unpackercls(fh, alg)
             def _changegroupinfo(repo, nodes, source):
                 if repo.ui.verbose or source == 'bundle':
                     repo.ui.status(_("%d changesets found\n") % len(nodes))
                 if repo.ui.debugflag:
                     repo.ui.debug("list of changesets:\n")
                     for node in nodes:
                         repo.ui.debug("%s\n" % hex(node))
             def getsubsetraw(repo, outgoing, bundler, source, fastpath=False):
                 """Run the 'preoutgoing' hook and return bundler's raw changegroup.

                 ``outgoing`` supplies the common nodes, the missing changesets and
                 the missing heads. The linkrev fast path is used when ``fastpath``
                 is set, or when the missing heads are exactly the heads of the
                 unfiltered repo. The result is whatever ``bundler.generate()``
                 returns. The hook is run with throw=True.
                 """
                 repo = repo.unfiltered()
                 commonrevs = outgoing.common
                 csets = outgoing.missing
                 # Sort a copy: sorting outgoing.missingheads in place would reorder
                 # a list that still belongs to the caller's outgoing object.
                 heads = sorted(outgoing.missingheads)
                 # We go through the fast path if we get told to, or if all
                 # (unfiltered) heads have been requested (since we then know that
                 # all linkrevs will be pulled by the client).
                 fastpathlinkrev = fastpath or (
                         repo.filtername is None and heads == sorted(repo.heads()))
                 repo.hook('preoutgoing', throw=True, source=source)
                 _changegroupinfo(repo, csets, source)
                 return bundler.generate(commonrevs, csets, fastpathlinkrev, source)
             def getsubset(repo, outgoing, bundler, source, fastpath=False):
                 """Like getsubsetraw, but wrap the raw chunks in an unbundler.

                 The raw generator is buffered with util.chunkbuffer and handed to
                 the unbundler matching the bundler's version.
                 """
                 rawchunks = getsubsetraw(repo, outgoing, bundler, source, fastpath)
                 version = bundler.version
                 stream = util.chunkbuffer(rawchunks)
                 return getunbundler(version, stream, None)
             def changegroupsubset(repo, roots, heads, source, version='01'):
                 """Build a changegroup of the nodes between ``roots`` and ``heads``.

                 The changegroup consists of all the nodes that are descendants of
                 any of the roots and ancestors of any of the heads. An empty
                 ``roots`` stands for [nullid].

                 The result is an unbundler over the generated chunks.

                 Working out which filenodes and manifest nodes must be included
                 for the changesets to be complete is non-trivial, and so is the
                 reverse: finding which changeset in the changegroup a particular
                 filenode or manifestnode belongs to.
                 """
                 changelog = repo.changelog
                 roots = roots or [nullid]
                 # candidate discovery bases: every non-null parent of a root
                 rootparents = [parent
                                for root in roots
                                for parent in changelog.parents(root)
                                if parent != nullid]
                 # TODO: remove call to nodesbetween.
                 csets, roots, heads = changelog.nodesbetween(roots, heads)
                 included = set(csets)
                 # parents that are themselves part of the changegroup are not bases
                 discbases = [node for node in rootparents if node not in included]
                 outgoing = discovery.outgoing(changelog, discbases, heads)
                 return getsubset(repo, outgoing, getbundler(version, repo), source)
             def getlocalchangegroupraw(repo, source, outgoing, bundlecaps=None,
                                        version='01'):
                 """Like getbundle, but driven by a discovery.outgoing object.

                 Only implemented for local repos; potentially precomputed sets in
                 ``outgoing`` are reused. Returns a raw changegroup generator, or
                 None when ``outgoing`` has nothing missing.
                 """
                 if outgoing.missing:
                     bundler = getbundler(version, repo, bundlecaps)
                     return getsubsetraw(repo, outgoing, bundler, source)
                 return None
             def getlocalchangegroup(repo, source, outgoing, bundlecaps=None,
                                     version='01'):
                 """Like getbundle, but driven by a discovery.outgoing object.

                 Only implemented for local repos; potentially precomputed sets in
                 ``outgoing`` are reused. Returns None when ``outgoing`` has nothing
                 missing.
                 """
                 if outgoing.missing:
                     bundler = getbundler(version, repo, bundlecaps)
                     return getsubset(repo, outgoing, bundler, source)
                 return None
             def computeoutgoing(repo, heads, common):
                 """Compute the outgoing revs for a set of common nodes and heads.

                 Nodes in ``common`` that the changelog does not know are dropped;
                 an empty ``common`` stands for [nullid] and an empty ``heads`` for
                 the changelog heads.

                 Kept as a separate function so extensions can reach the logic.

                 Returns a discovery.outgoing object.
                 """
                 changelog = repo.changelog
                 if not common:
                     common = [nullid]
                 else:
                     isknown = changelog.hasnode
                     common = [node for node in common if isknown(node)]
                 if not heads:
                     heads = changelog.heads()
                 return discovery.outgoing(changelog, common, heads)
             def getchangegroup(repo, source, heads=None, common=None, bundlecaps=None,
                                version='01'):
                 """Like changegroupsubset, but based on a set difference.

                 The result covers the ancestors of ``heads`` minus the ancestors
                 of ``common``.

                 If heads is None, use the local heads. If common is None, use
                 [nullid].

                 The nodes in common might not all be known locally due to the way
                 the current discovery protocol works.
                 """
                 return getlocalchangegroup(repo, source,
                                            computeoutgoing(repo, heads, common),
                                            bundlecaps=bundlecaps, version=version)
             def changegroup(repo, basenodes, source):
                 """Build a changegroup from ``basenodes`` up to the repo heads."""
                 # to avoid a race we use changegroupsubset() (issue1320)
                 currentheads = repo.heads()
                 return changegroupsubset(repo, basenodes, currentheads, source)
             def _addchangegroupfiles(repo, source, revmap, trp, pr, needfiles):
                 """Add every file revlog group read from ``source`` to ``repo``.

                 ``revmap`` and ``trp`` are passed through to each filelog's
                 addgroup(). ``pr`` is called once, without arguments, per file.
                 ``needfiles`` maps a file name to the collection of file nodes
                 still expected; nodes are removed from it as they arrive, and
                 whatever remains afterwards must already exist in the filelog.

                 Returns a (revisions, files) tuple of the counts added.

                 Raises error.Abort when a received group is empty, when a delta
                 base is censored, when a received entry was not expected, or when
                 expected file data is missing.
                 """
                 ui = repo.ui
                 revcount = 0
                 filecount = 0
                 header = source.filelogheader()
                 while header:
                     fname = header["filename"]
                     ui.debug("adding %s revisions\n" % fname)
                     pr()
                     filelog = repo.file(fname)
                     oldlen = len(filelog)
                     try:
                         added = filelog.addgroup(source, revmap, trp)
                     except error.CensoredBaseError as e:
                         raise error.Abort(_("received delta base is censored: %s") % e)
                     if not added:
                         raise error.Abort(_("received file revlog group is empty"))
                     newlen = len(filelog)
                     revcount += newlen - oldlen
                     filecount += 1
                     if fname in needfiles:
                         # tick off every newly added node against what was expected
                         needs = needfiles[fname]
                         for rev in xrange(oldlen, newlen):
                             node = filelog.node(rev)
                             if node not in needs:
                                 raise error.Abort(
                                     _("received spurious file revlog entry"))
                             needs.remove(node)
                         if not needs:
                             del needfiles[fname]
                     header = source.filelogheader()
                 ui.progress(_('files'), None)
                 # anything still listed was not received; it has to exist locally
                 for fname, needs in needfiles.iteritems():
                     filelog = repo.file(fname)
                     for node in needs:
                         try:
                             filelog.rev(node)
                         except error.LookupError:
                             raise error.Abort(
                                 _('missing file data for %s:%s - run hg verify') %
                                 (fname, hex(node)))
                 return revcount, filecount