upstream/mercurial-mirror Commit - r28228:abf12026

1

# changegroup.py - Mercurial changegroup manipulation functions

1

# changegroup.py - Mercurial changegroup manipulation functions

2

#

2

#

3

4

#

4

#

5

# This software may be used and distributed according to the terms of the

5

# This software may be used and distributed according to the terms of the

6

# GNU General Public License version 2 or any later version.

6

# GNU General Public License version 2 or any later version.

7

8

from __future__ import absolute_import

8

from __future__ import absolute_import

9

10

import os

10

import os

11

import struct

11

import struct

12

import tempfile

12

import tempfile

13

import weakref

13

import weakref

14

15

from .i18n import _

15

from .i18n import _

16

from .node import (

16

from .node import (

17

hex,

17

hex,

18

nullid,

18

nullid,

19

nullrev,

19

nullrev,

20

short,

20

short,

21

)

21

)

22

23

from . import (

23

from . import (

24

branchmap,

24

branchmap,

25

dagutil,

25

dagutil,

26

discovery,

26

discovery,

27

error,

27

error,

28

mdiff,

28

mdiff,

29

phases,

29

phases,

30

util,

30

util,

31

)

31

)

32

33

_CHANGEGROUPV1_DELTA_HEADER = "20s20s20s20s"

33

_CHANGEGROUPV1_DELTA_HEADER = "20s20s20s20s"

34

_CHANGEGROUPV2_DELTA_HEADER = "20s20s20s20s20s"

34

_CHANGEGROUPV2_DELTA_HEADER = "20s20s20s20s20s"

35

_CHANGEGROUPV3_DELTA_HEADER = ">20s20s20s20s20sH"

35

_CHANGEGROUPV3_DELTA_HEADER = ">20s20s20s20s20sH"

36

37

def readexactly(stream, n):
    '''Read exactly n bytes from stream, aborting on a short read.

    Returns the data obtained from a single stream.read(n) call. Raises
    error.Abort when fewer than n bytes came back.
    '''
    data = stream.read(n)
    got = len(data)
    if got >= n:
        return data
    raise error.Abort(_("stream ended unexpectedly"
                        " (got %d bytes, expected %d)")
                      % (got, n))

45

46

def getchunk(stream):
    """Return the payload of the next chunk read from stream.

    A chunk starts with a 4-byte big-endian signed length that counts the
    length field itself. A length of 0 marks an empty chunk and yields "";
    any other length of 4 or less is rejected with error.Abort.
    """
    header = readexactly(stream, 4)
    (length,) = struct.unpack(">l", header)
    if length > 4:
        # the advertised length includes the 4 header bytes just consumed
        return readexactly(stream, length - 4)
    if length != 0:
        raise error.Abort(_("invalid chunk length %d") % length)
    return ""

55

56

def chunkheader(length):
    """Return the header (string) announcing a chunk of `length` bytes.

    The encoded value is the payload length plus the 4 bytes taken by the
    header itself, packed as a big-endian signed 32-bit integer.
    """
    framed = length + 4
    return struct.pack(">l", framed)

59

60

def closechunk():
    """Return the header (string) of a zero-length chunk.

    The length field is a literal 0 rather than 4, which is what readers in
    this module treat as the empty chunk.
    """
    terminator = struct.pack(">l", 0)
    return terminator

63

64

def combineresults(results):
    """Combine 0 or more addchangegroup results into one.

    Each result is an integer: 0 means nothing changed, 1 means the number
    of heads is unchanged, 2..n means n-1 heads were added and -2..-n means
    n-1 heads were removed.

    Returns 0 as soon as any individual result is 0. Otherwise the head
    deltas are summed and re-encoded the same way (1 when they cancel out
    or when `results` is empty).
    """
    changedheads = 0
    for ret in results:
        # If any changegroup result is 0, return 0. Returning right away
        # (instead of breaking out of the loop) keeps head changes counted
        # so far from overriding the 0.
        if ret == 0:
            return 0
        if ret < -1:
            changedheads += ret + 1
        elif ret > 1:
            changedheads += ret - 1
    if changedheads > 0:
        return 1 + changedheads
    if changedheads < 0:
        return -1 + changedheads
    return 1

82

83

# Maps a bundle type name to a (header, compression) pair; writebundle()
# writes the header verbatim and looks the compression up in
# util.compressors.
bundletypes = {
    # Headerless: only when using unbundle on ssh and old http servers.
    # Since the unification ssh accepts a header but there is no
    # capability signaling it.
    "": ("", None),
    # No tuple here: writebundle() handles "HG20" in a dedicated branch.
    "HG20": (),
    "HG10UN": ("HG10UN", None),
    # NOTE(review): the header is only "HG10"; presumably the compressor
    # output supplies the "BZ" part (the unpacker maps 'BZ' to
    # '_truncatedBZ') - confirm against util.compressors.
    "HG10BZ": ("HG10", "BZ"),
    "HG10GZ": ("HG10GZ", "GZ"),
}

# hgweb uses this list to communicate its preferred type
bundlepriority = ["HG10GZ", "HG10BZ", "HG10UN"]

95

96

def writechunks(ui, chunks, filename, vfs=None):
    """Write every item of chunks to a file and return the file's name.

    The stream is assumed to be a bundle file.

    When filename is empty, a temporary file (prefix "hg-bundle-", suffix
    ".hg") is created and its path is returned. Otherwise filename is
    opened in "wb" mode, through vfs when one is given.

    If writing fails part-way, the file is closed and removed before the
    exception propagates. The ui argument is not used here.
    """
    handle = None
    pending = None  # path to delete should writing not complete
    try:
        if not filename:
            fd, filename = tempfile.mkstemp(prefix="hg-bundle-", suffix=".hg")
            handle = os.fdopen(fd, "wb")
        elif vfs:
            handle = vfs.open(filename, "wb")
        else:
            handle = open(filename, "wb")
        pending = filename
        for piece in chunks:
            handle.write(piece)
        # everything was written: keep the file
        pending = None
        return filename
    finally:
        if handle is not None:
            handle.close()
        if pending is not None:
            remove = vfs.unlink if (filename and vfs) else os.unlink
            remove(pending)

127

128

def writebundle(ui, cg, filename, bundletype, vfs=None, compression=None):
    """Write the changegroup cg as a bundle file and return its filename.

    If no filename is specified, a temporary file is created.
    The bundle file will be deleted in case of errors.

    For bundletype "HG20" the changegroup becomes a 'changegroup' part of a
    bundle2 container and `compression` is handed to that container. For
    every other type the (header, compression) pair comes from bundletypes,
    `compression` must be None, and only version '01' changegroups are
    accepted.
    """
    if bundletype == "HG20":
        from . import bundle2
        bundler = bundle2.bundle20(ui)
        bundler.setcompression(compression)
        cgpart = bundler.newpart('changegroup', data=cg.getchunks())
        cgpart.addparam('version', cg.version)
        return writechunks(ui, bundler.getchunks(), filename, vfs=vfs)

    # compression argument is only for the bundle2 case
    assert compression is None
    if cg.version != '01':
        raise error.Abort(_('old bundle types only supports v1 '
                            'changegroups'))
    header, comp = bundletypes[bundletype]
    if comp not in util.compressors:
        raise error.Abort(_('unknown stream compression type: %s')
                          % comp)
    compressor = util.compressors[comp]()
    rawchunks = cg.getchunks()

    def compressedchunks():
        # the header goes out as-is; only changegroup data is compressed
        yield header
        for chunk in rawchunks:
            yield compressor.compress(chunk)
        yield compressor.flush()

    return writechunks(ui, compressedchunks(), filename, vfs=vfs)

170

171

class cg1unpacker(object):
    """Unpacker for cg1 changegroup streams.

    A changegroup unpacker handles the framing of the revision data in
    the wire format. Most consumers will want to use the apply()
    method to add the changes from the changegroup to a repository.

    If you're forwarding a changegroup unmodified to another consumer,
    use getchunks(), which returns an iterator of changegroup
    chunks. This is mostly useful for cases where you need to know the
    data stream has ended by observing the end of the changegroup.

    deltachunk() is useful only if you're applying delta data. Most
    consumers should prefer apply() instead.

    A few other public methods exist. Those are used only for
    bundlerepo and some debug commands - their use is discouraged.
    """
    deltaheader = _CHANGEGROUPV1_DELTA_HEADER
    deltaheadersize = struct.calcsize(deltaheader)
    version = '01'
    _grouplistcount = 1 # One list of files after the manifests

    def __init__(self, fh, alg):
        """Wrap file object fh, decompressing it according to alg.

        alg must be 'UN' (treated as None) or a key of util.decompressors;
        anything else raises error.Abort.
        """
        if alg == 'UN':
            alg = None # get more modern without breaking too much
        if alg not in util.decompressors:
            raise error.Abort(_('unknown stream compression type: %s')
                             % alg)
        if alg == 'BZ':
            alg = '_truncatedBZ'
        self._stream = util.decompressors[alg](fh)
        self._type = alg
        # optional zero-argument callable, invoked by _chunklength() once
        # per non-empty chunk (apply() uses it for progress reporting)
        self.callback = None

    # These methods (compressed, read, seek, tell) all appear to only
    # be used by bundlerepo, but it's a little hard to tell.
    def compressed(self):
        """Return True unless the stream was opened uncompressed."""
        return self._type is not None
    def read(self, l):
        return self._stream.read(l)
    def seek(self, pos):
        return self._stream.seek(pos)
    def tell(self):
        return self._stream.tell()
    def close(self):
        return self._stream.close()

    def _chunklength(self):
        """Read a chunk header and return the payload length that follows.

        Returns 0 for an empty chunk. Raises error.Abort for any other
        length field of 4 or less. Fires self.callback, when set, for each
        non-empty chunk.
        """
        d = readexactly(self._stream, 4)
        l = struct.unpack(">l", d)[0]
        if l <= 4:
            if l:
                raise error.Abort(_("invalid chunk length %d") % l)
            return 0
        if self.callback:
            self.callback()
        # the length field counts its own 4 bytes
        return l - 4

    def changelogheader(self):
        """v10 does not have a changelog header chunk"""
        return {}

    def manifestheader(self):
        """v10 does not have a manifest header chunk"""
        return {}

    def filelogheader(self):
        """return the header of the filelogs chunk, v10 only has the filename

        An empty dict is returned when the next chunk is empty.
        """
        l = self._chunklength()
        if not l:
            return {}
        fname = readexactly(self._stream, l)
        return {'filename': fname}

    def _deltaheader(self, headertuple, prevnode):
        """Expand an unpacked delta header to the common 6-tuple.

        Returns (node, p1, p2, deltabase, cs, flags). This format stores no
        delta base: it is p1 when prevnode is None, else prevnode. flags is
        always 0.
        """
        node, p1, p2, cs = headertuple
        if prevnode is None:
            deltabase = p1
        else:
            deltabase = prevnode
        flags = 0
        return node, p1, p2, deltabase, cs, flags

    def deltachunk(self, prevnode):
        """Read the next delta chunk and return it as a dict.

        The dict has the keys 'node', 'p1', 'p2', 'cs', 'deltabase',
        'delta' and 'flags'. An empty dict is returned for an empty chunk.
        Raises error.Abort when the chunk is too short to hold the delta
        header.
        """
        l = self._chunklength()
        if not l:
            return {}
        if l < self.deltaheadersize:
            # Without this check the delta read below would get a negative
            # length, which readexactly() cannot flag as a short read.
            raise error.Abort(_("delta chunk too short"
                                " (got %d bytes, expected at least %d)")
                              % (l, self.deltaheadersize))
        headerdata = readexactly(self._stream, self.deltaheadersize)
        header = struct.unpack(self.deltaheader, headerdata)
        delta = readexactly(self._stream, l - self.deltaheadersize)
        node, p1, p2, deltabase, cs, flags = self._deltaheader(header, prevnode)
        return {'node': node, 'p1': p1, 'p2': p2, 'cs': cs,
                'deltabase': deltabase, 'delta': delta, 'flags': flags}

    def getchunks(self):
        """return all the chunks contained in the bundle

        Used when you need to forward the binary stream to a file or another
        network API. To do so, it parses the changegroup data; otherwise it
        would block in case of sshrepo because it doesn't know the end of
        the stream.
        """
        # an empty chunkgroup is the end of the changegroup
        # a changegroup has at least 2 chunkgroups (changelog and manifest).
        # after that, changegroup versions 1 and 2 have a series of groups
        # with one group per file. changegroup 3 has a series of directory
        # manifests before the files.
        count = 0
        emptycount = 0
        while emptycount < self._grouplistcount:
            empty = True
            count += 1
            while True:
                chunk = getchunk(self)
                if not chunk:
                    # the first two groups may be empty without ending a list
                    if empty and count > 2:
                        emptycount += 1
                    break
                empty = False
                yield chunkheader(len(chunk))
                # hand the payload out in pieces of at most 1 MiB
                pos = 0
                while pos < len(chunk):
                    end = pos + 2**20
                    yield chunk[pos:end]
                    pos = end
            yield closechunk()

    def _unpackmanifests(self, repo, revmap, trp, prog, numchanges):
        """Add the manifest group of the stream to repo.manifest.

        prog is the progress-callback factory defined in apply();
        numchanges is used as the progress total.
        """
        # We know that we'll never have more manifests than we had
        # changesets.
        self.callback = prog(_('manifests'), numchanges)
        # no need to check for empty manifest group here:
        # if the result of the merge of 1 and 2 is the same in 3 and 4,
        # no new manifest will be created and the manifest group will
        # be empty during the pull
        self.manifestheader()
        repo.manifest.addgroup(self, revmap, trp)
        repo.ui.progress(_('manifests'), None)

    def apply(self, repo, srctype, url, emptyok=False,
              targetphase=phases.draft, expectedtotal=None):
        """Add the changegroup returned by source.read() to this repo.
        srctype is a string like 'push', 'pull', or 'unbundle'.  url is
        the URL of the repo where this changegroup is coming from.

        emptyok allows an empty changelog group (otherwise error.Abort is
        raised). targetphase is the phase boundary applied to the added
        changesets except for 'push', 'serve' and 'strip' sources.
        expectedtotal is the total used for changeset progress output.

        Return an integer summarizing the change to this repo:
        - nothing changed or no source: 0
        - more heads than before: 1+added heads (2..n)
        - fewer heads than before: -1-removed heads (-2..-n)
        - number of heads stays the same: 1
        """
        repo = repo.unfiltered()
        # csmap and revmap read `cl`, which is only bound further down,
        # inside the transaction; they are not called before that.
        def csmap(x):
            repo.ui.debug("add changeset %s\n" % short(x))
            return len(cl)

        def revmap(x):
            return cl.rev(x)

        changesets = files = revisions = 0

        try:
            with repo.transaction("\n".join([srctype,
                                             util.hidepassword(url)])) as tr:
                # The transaction could have been created before and already
                # carries source information. In this case we use the top
                # level data. We overwrite the argument because we need to use
                # the top level value (if they exist) in this function.
                srctype = tr.hookargs.setdefault('source', srctype)
                url = tr.hookargs.setdefault('url', url)
                repo.hook('prechangegroup', throw=True, **tr.hookargs)

                # write changelog data to temp files so concurrent readers
                # will not see an inconsistent view
                cl = repo.changelog
                cl.delayupdate(tr)
                oldheads = cl.heads()

                trp = weakref.proxy(tr)
                # pull off the changeset group
                repo.ui.status(_("adding changesets\n"))
                clstart = len(cl)
                class prog(object):
                    # progress reporter: each call reports one more chunk
                    # for the given step
                    def __init__(self, step, total):
                        self._step = step
                        self._total = total
                        self._count = 1
                    def __call__(self):
                        repo.ui.progress(self._step, self._count,
                                         unit=_('chunks'), total=self._total)
                        self._count += 1
                self.callback = prog(_('changesets'), expectedtotal)

                # collects item [3] of every added changelog entry
                # (presumably the list of touched files - TODO confirm)
                efiles = set()
                def onchangelog(cl, node):
                    efiles.update(cl.read(node)[3])

                self.changelogheader()
                srccontent = cl.addgroup(self, csmap, trp,
                                         addrevisioncb=onchangelog)
                # from here on only the count is needed
                efiles = len(efiles)

                if not (srccontent or emptyok):
                    raise error.Abort(_("received changelog group is empty"))
                clend = len(cl)
                changesets = clend - clstart
                repo.ui.progress(_('changesets'), None)

                # pull off the manifest group
                repo.ui.status(_("adding manifests\n"))
                self._unpackmanifests(repo, revmap, trp, prog, changesets)

                needfiles = {}
                if repo.ui.configbool('server', 'validate', default=False):
                    # validate incoming csets have their manifests
                    for cset in xrange(clstart, clend):
                        mfnode = repo.changelog.read(
                            repo.changelog.node(cset))[0]
                        mfest = repo.manifest.readdelta(mfnode)
                        # store file nodes we must see
                        for f, n in mfest.iteritems():
                            needfiles.setdefault(f, set()).add(n)

                # process the files
                repo.ui.status(_("adding file changes\n"))
                self.callback = None
                pr = prog(_('files'), efiles)
                newrevs, newfiles = _addchangegroupfiles(
                    repo, self, revmap, trp, pr, needfiles)
                revisions += newrevs
                files += newfiles

                # dh is the change in head count; new heads that close
                # their branch are not counted
                dh = 0
                if oldheads:
                    heads = cl.heads()
                    dh = len(heads) - len(oldheads)
                    for h in heads:
                        if h not in oldheads and repo[h].closesbranch():
                            dh -= 1
                htext = ""
                if dh:
                    htext = _(" (%+d heads)") % dh

                repo.ui.status(_("added %d changesets"
                                 " with %d changes to %d files%s\n")
                                 % (changesets, revisions, files, htext))
                repo.invalidatevolatilesets()

                if changesets > 0:
                    # 'node'/'node_last' are stored on the transaction only
                    # when it has no 'node' yet; otherwise they go into the
                    # local copy used for the hooks below
                    if 'node' not in tr.hookargs:
                        tr.hookargs['node'] = hex(cl.node(clstart))
                        tr.hookargs['node_last'] = hex(cl.node(clend - 1))
                        hookargs = dict(tr.hookargs)
                    else:
                        hookargs = dict(tr.hookargs)
                        hookargs['node'] = hex(cl.node(clstart))
                        hookargs['node_last'] = hex(cl.node(clend - 1))
                    repo.hook('pretxnchangegroup', throw=True, **hookargs)

                added = [cl.node(r) for r in xrange(clstart, clend)]
                publishing = repo.publishing()
                if srctype in ('push', 'serve'):
                    # Old servers can not push the boundary themselves.
                    # New servers won't push the boundary if changeset already
                    # exists locally as secret
                    #
                    # We should not use added here but the list of all change in
                    # the bundle
                    if publishing:
                        phases.advanceboundary(repo, tr, phases.public,
                                               srccontent)
                    else:
                        # Those changesets have been pushed from the
                        # outside, their phases are going to be pushed
                        # alongside. Therefore `targetphase` is
                        # ignored.
                        phases.advanceboundary(repo, tr, phases.draft,
                                               srccontent)
                        phases.retractboundary(repo, tr, phases.draft, added)
                elif srctype != 'strip':
                    # publishing only alter behavior during push
                    #
                    # strip should not touch boundary at all
                    phases.retractboundary(repo, tr, targetphase, added)

                if changesets > 0:
                    if srctype != 'strip':
                        # During strip, branchcache is invalid but
                        # coming call to `destroyed` will repair it.
                        # In other case we can safely update cache on
                        # disk.
                        branchmap.updatecache(repo.filtered('served'))

                    def runhooks():
                        # These hooks run when the lock releases, not when the
                        # transaction closes. So it's possible for the changelog
                        # to have changed since we last saw it.
                        if clstart >= len(repo):
                            return

                        # forcefully update the on-disk branch cache
                        repo.ui.debug("updating the branch cache\n")
                        repo.hook("changegroup", **hookargs)

                        for n in added:
                            args = hookargs.copy()
                            args['node'] = hex(n)
                            del args['node_last']
                            repo.hook("incoming", **args)

                        newheads = [h for h in repo.heads()
                                    if h not in oldheads]
                        repo.ui.log("incoming",
                                    "%s incoming changes - new heads: %s\n",
                                    len(added),
                                    ', '.join([hex(c[:6]) for c in newheads]))

                    tr.addpostclose('changegroup-runhooks-%020i' % clstart,
                                    lambda tr: repo._afterlock(runhooks))
        finally:
            repo.ui.flush()
        # never return 0 here:
        if dh < 0:
            return dh - 1
        else:
            return dh + 1

497

498

class cg2unpacker(cg1unpacker):

498

class cg2unpacker(cg1unpacker):

499

"""Unpacker for cg2 streams.

499

"""Unpacker for cg2 streams.

500

501

cg2 streams add support for generaldelta, so the delta header

501

cg2 streams add support for generaldelta, so the delta header

502

format is slightly different. All other features about the data

502

format is slightly different. All other features about the data

503

remain the same.

503

remain the same.

504

"""

504

"""

505

deltaheader = _CHANGEGROUPV2_DELTA_HEADER

505

deltaheader = _CHANGEGROUPV2_DELTA_HEADER

506

deltaheadersize = struct.calcsize(deltaheader)

506

deltaheadersize = struct.calcsize(deltaheader)

507

version = '02'

507

version = '02'

508

509

def _deltaheader(self, headertuple, prevnode):

509

def _deltaheader(self, headertuple, prevnode):

510

node, p1, p2, deltabase, cs = headertuple

510

node, p1, p2, deltabase, cs = headertuple

511

flags = 0

511

flags = 0

512

return node, p1, p2, deltabase, cs, flags

512

return node, p1, p2, deltabase, cs, flags

513

514

class cg3unpacker(cg2unpacker):

514

class cg3unpacker(cg2unpacker):

515

"""Unpacker for cg3 streams.

515

"""Unpacker for cg3 streams.

516

517

cg3 streams add support for exchanging treemanifests and revlog

517

cg3 streams add support for exchanging treemanifests and revlog

518

flags. It adds the revlog flags to the delta header and an empty chunk

518

flags. It adds the revlog flags to the delta header and an empty chunk

519

separating manifests and files.

519

separating manifests and files.

520

"""

520

"""

521

deltaheader = _CHANGEGROUPV3_DELTA_HEADER

521

deltaheader = _CHANGEGROUPV3_DELTA_HEADER

522

deltaheadersize = struct.calcsize(deltaheader)

522

deltaheadersize = struct.calcsize(deltaheader)

523

version = '03'

523

version = '03'

524

_grouplistcount = 2 # One list of manifests and one list of files

524

_grouplistcount = 2 # One list of manifests and one list of files

525

526

def _deltaheader(self, headertuple, prevnode):

526

def _deltaheader(self, headertuple, prevnode):

527

node, p1, p2, deltabase, cs, flags = headertuple

527

node, p1, p2, deltabase, cs, flags = headertuple

528

return node, p1, p2, deltabase, cs, flags

528

return node, p1, p2, deltabase, cs, flags

529

530

def _unpackmanifests(self, repo, revmap, trp, prog, numchanges):

530

def _unpackmanifests(self, repo, revmap, trp, prog, numchanges):

531

super(cg3unpacker, self)._unpackmanifests(repo, revmap, trp, prog,

531

super(cg3unpacker, self)._unpackmanifests(repo, revmap, trp, prog,

532

numchanges)

532

numchanges)

533

while True:

533

while True:

534

chunkdata = self.filelogheader()

534

chunkdata = self.filelogheader()

535

if not chunkdata:

535

if not chunkdata:

536

break

536

break

537

# If we get here, there are directory manifests in the changegroup

537

# If we get here, there are directory manifests in the changegroup

538

d = chunkdata["filename"]

538

d = chunkdata["filename"]

539

repo.ui.debug("adding %s revisions\n" % d)

539

repo.ui.debug("adding %s revisions\n" % d)

540

dirlog = repo.manifest.dirlog(d)

540

dirlog = repo.manifest.dirlog(d)

541

if not dirlog.addgroup(self, revmap, trp):

541

if not dirlog.addgroup(self, revmap, trp):

542

raise error.Abort(_("received dir revlog group is empty"))

542

raise error.Abort(_("received dir revlog group is empty"))

543

544

class headerlessfixup(object):

544

class headerlessfixup(object):

545

def __init__(self, fh, h):

545

def __init__(self, fh, h):

546

self._h = h

546

self._h = h

547

self._fh = fh

547

self._fh = fh

548

def read(self, n):

548

def read(self, n):

549

if self._h:

549

if self._h:

550

d, self._h = self._h[:n], self._h[n:]

550

d, self._h = self._h[:n], self._h[n:]

551

if len(d) < n:

551

if len(d) < n:

552

d += readexactly(self._fh, n - len(d))

552

d += readexactly(self._fh, n - len(d))

553

return d

553

return d

554

return readexactly(self._fh, n)

554

return readexactly(self._fh, n)

555

556

def _moddirs(files):

556

def _moddirs(files):

557

"""Given a set of modified files, find the list of modified directories.

557

"""Given a set of modified files, find the list of modified directories.

558

559

This returns a list of (path to changed dir, changed dir) tuples,

559

This returns a list of (path to changed dir, changed dir) tuples,

560

as that's what the one client needs anyway.

560

as that's what the one client needs anyway.

561

562

>>> _moddirs(['a/b/c.py', 'a/b/c.txt', 'a/d/e/f/g.txt', 'i.txt', ])

562

>>> _moddirs(['a/b/c.py', 'a/b/c.txt', 'a/d/e/f/g.txt', 'i.txt', ])

563

[('/', 'a/'), ('a/', 'b/'), ('a/', 'd/'), ('a/d/', 'e/'), ('a/d/e/', 'f/')]

563

[('/', 'a/'), ('a/', 'b/'), ('a/', 'd/'), ('a/d/', 'e/'), ('a/d/e/', 'f/')]

564

565

"""

565

"""

566

alldirs = set()

566

alldirs = set()

567

for f in files:

567

for f in files:

568

path = f.split('/')[:-1]

568

path = f.split('/')[:-1]

569

for i in xrange(len(path) - 1, -1, -1):

569

for i in xrange(len(path) - 1, -1, -1):

570

dn = '/'.join(path[:i])

570

dn = '/'.join(path[:i])

571

current = dn + '/', path[i] + '/'

571

current = dn + '/', path[i] + '/'

572

if current in alldirs:

572

if current in alldirs:

573

break

573

break

574

alldirs.add(current)

574

alldirs.add(current)

575

return sorted(alldirs)

575

return sorted(alldirs)

576

577

class cg1packer(object):

577

class cg1packer(object):

578

deltaheader = _CHANGEGROUPV1_DELTA_HEADER

578

deltaheader = _CHANGEGROUPV1_DELTA_HEADER

579

version = '01'

579

version = '01'

580

def __init__(self, repo, bundlecaps=None):

580

def __init__(self, repo, bundlecaps=None):

581

"""Given a source repo, construct a bundler.

581

"""Given a source repo, construct a bundler.

582

583

bundlecaps is optional and can be used to specify the set of

583

bundlecaps is optional and can be used to specify the set of

584

capabilities which can be used to build the bundle.

584

capabilities which can be used to build the bundle.

585

"""

585

"""

586

# Set of capabilities we can use to build the bundle.

586

# Set of capabilities we can use to build the bundle.

587

if bundlecaps is None:

587

if bundlecaps is None:

588

bundlecaps = set()

588

bundlecaps = set()

589

self._bundlecaps = bundlecaps

589

self._bundlecaps = bundlecaps

590

# experimental config: bundle.reorder

590

# experimental config: bundle.reorder

591

reorder = repo.ui.config('bundle', 'reorder', 'auto')

591

reorder = repo.ui.config('bundle', 'reorder', 'auto')

592

if reorder == 'auto':

592

if reorder == 'auto':

593

reorder = None

593

reorder = None

594

else:

594

else:

595

reorder = util.parsebool(reorder)

595

reorder = util.parsebool(reorder)

596

self._repo = repo

596

self._repo = repo

597

self._reorder = reorder

597

self._reorder = reorder

598

self._progress = repo.ui.progress

598

self._progress = repo.ui.progress

599

if self._repo.ui.verbose and not self._repo.ui.debugflag:

599

if self._repo.ui.verbose and not self._repo.ui.debugflag:

600

self._verbosenote = self._repo.ui.note

600

self._verbosenote = self._repo.ui.note

601

else:

601

else:

602

self._verbosenote = lambda s: None

602

self._verbosenote = lambda s: None

603

604

def close(self):

604

def close(self):

605

return closechunk()

605

return closechunk()

606

607

def fileheader(self, fname):

607

def fileheader(self, fname):

608

return chunkheader(len(fname)) + fname

608

return chunkheader(len(fname)) + fname

609

610

def group(self, nodelist, revlog, lookup, units=None):

610

def group(self, nodelist, revlog, lookup, units=None):

611

"""Calculate a delta group, yielding a sequence of changegroup chunks

611

"""Calculate a delta group, yielding a sequence of changegroup chunks

612

(strings).

612

(strings).

613

614

Given a list of changeset revs, return a set of deltas and

614

Given a list of changeset revs, return a set of deltas and

615

metadata corresponding to nodes. The first delta is

615

metadata corresponding to nodes. The first delta is

616

first parent(nodelist[0]) -> nodelist[0], the receiver is

616

first parent(nodelist[0]) -> nodelist[0], the receiver is

617

guaranteed to have this parent as it has all history before

617

guaranteed to have this parent as it has all history before

618

these changesets. In the case firstparent is nullrev the

618

these changesets. In the case firstparent is nullrev the

619

changegroup starts with a full revision.

619

changegroup starts with a full revision.

620

621

If units is not None, progress detail will be generated, units specifies

621

If units is not None, progress detail will be generated, units specifies

622

the type of revlog that is touched (changelog, manifest, etc.).

622

the type of revlog that is touched (changelog, manifest, etc.).

623

"""

623

"""

624

# if we don't have any revisions touched by these changesets, bail

624

# if we don't have any revisions touched by these changesets, bail

625

if len(nodelist) == 0:

625

if len(nodelist) == 0:

626

yield self.close()

626

yield self.close()

627

return

627

return

628

629

# for generaldelta revlogs, we linearize the revs; this will both be

629

# for generaldelta revlogs, we linearize the revs; this will both be

630

# much quicker and generate a much smaller bundle

630

# much quicker and generate a much smaller bundle

631

if (revlog._generaldelta and self._reorder is None) or self._reorder:

631

if (revlog._generaldelta and self._reorder is None) or self._reorder:

632

dag = dagutil.revlogdag(revlog)

632

dag = dagutil.revlogdag(revlog)

633

revs = set(revlog.rev(n) for n in nodelist)

633

revs = set(revlog.rev(n) for n in nodelist)

634

revs = dag.linearize(revs)

634

revs = dag.linearize(revs)

635

else:

635

else:

636

revs = sorted([revlog.rev(n) for n in nodelist])

636

revs = sorted([revlog.rev(n) for n in nodelist])

637

638

# add the parent of the first rev

638

# add the parent of the first rev

639

p = revlog.parentrevs(revs[0])[0]

639

p = revlog.parentrevs(revs[0])[0]

640

revs.insert(0, p)

640

revs.insert(0, p)

641

642

# build deltas

642

# build deltas

643

total = len(revs) - 1

643

total = len(revs) - 1

644

msgbundling = _('bundling')

644

msgbundling = _('bundling')

645

for r in xrange(len(revs) - 1):

645

for r in xrange(len(revs) - 1):

646

if units is not None:

646

if units is not None:

647

self._progress(msgbundling, r + 1, unit=units, total=total)

647

self._progress(msgbundling, r + 1, unit=units, total=total)

648

prev, curr = revs[r], revs[r + 1]

648

prev, curr = revs[r], revs[r + 1]

649

linknode = lookup(revlog.node(curr))

649

linknode = lookup(revlog.node(curr))

650

for c in self.revchunk(revlog, curr, prev, linknode):

650

for c in self.revchunk(revlog, curr, prev, linknode):

651

yield c

651

yield c

652

653

if units is not None:

653

if units is not None:

654

self._progress(msgbundling, None)

654

self._progress(msgbundling, None)

655

yield self.close()

655

yield self.close()

656

657

# filter any nodes that claim to be part of the known set

657

# filter any nodes that claim to be part of the known set

658

def prune(self, revlog, missing, commonrevs):

658

def prune(self, revlog, missing, commonrevs):

659

rr, rl = revlog.rev, revlog.linkrev

659

rr, rl = revlog.rev, revlog.linkrev

660

return [n for n in missing if rl(rr(n)) not in commonrevs]

660

return [n for n in missing if rl(rr(n)) not in commonrevs]

661

662

def _packmanifests(self, ~~mfnodes~~, tmfnodes, lookuplinknode):

662

def _packmanifests(self, dir, mfnodes, lookuplinknode):

663

"""Pack flat manifests into a changegroup stream."""

663

"""Pack flat manifests into a changegroup stream."""

664

ml = self._repo.manifest

664

assert not dir

665

size = 0

665

for chunk in self.group(mfnodes, self._repo.manifest,

666

for chunk in self.group(

666

lookuplinknode, units=_('manifests')):

667

mfnodes, ml, lookuplinknode, units=_('manifests')):

668

size += len(chunk)

669

yield chunk

667

yield chunk

670

self._verbosenote(_('%8.i (manifests)\n') % size)

668

671

# It looks odd to assert this here, but tmfnodes doesn't get

669

def _manifestsdone(self):

672

# filled in until after we've called lookuplinknode for

670

return ''

673

# sending root manifests, so the only way to tell the streams

674

# got crossed is to check after we've done all the work.

675

assert not tmfnodes

676

671

677

def generate(self, commonrevs, clnodes, fastpathlinkrev, source):

672

def generate(self, commonrevs, clnodes, fastpathlinkrev, source):

678

'''yield a sequence of changegroup chunks (strings)'''

673

'''yield a sequence of changegroup chunks (strings)'''

679

repo = self._repo

674

repo = self._repo

680

cl = repo.changelog

675

cl = repo.changelog

681

676

682

clrevorder = {}

677

clrevorder = {}

683

mfs = {} # needed manifests

678

mfs = {} # needed manifests

684

fnodes = {} # needed file nodes

679

fnodes = {} # needed file nodes

685

# maps manifest node id -> set(changed files)

680

# maps manifest node id -> set(changed files)

686

mfchangedfiles = {}

681

mfchangedfiles = {}

687

682

688

# Callback for the changelog, used to collect changed files and manifest

683

# Callback for the changelog, used to collect changed files and manifest

689

# nodes.

684

# nodes.

690

# Returns the linkrev node (identity in the changelog case).

685

# Returns the linkrev node (identity in the changelog case).

691

def lookupcl(x):

686

def lookupcl(x):

692

c = cl.read(x)

687

c = cl.read(x)

693

clrevorder[x] = len(clrevorder)

688

clrevorder[x] = len(clrevorder)

694

n = c[0]

689

n = c[0]

695

# record the first changeset introducing this manifest version

690

# record the first changeset introducing this manifest version

696

mfs.setdefault(n, x)

691

mfs.setdefault(n, x)

697

# Record a complete list of potentially-changed files in

692

# Record a complete list of potentially-changed files in

698

# this manifest.

693

# this manifest.

699

mfchangedfiles.setdefault(n, set()).update(c[3])

694

mfchangedfiles.setdefault(n, set()).update(c[3])

700

return x

695

return x

701

696

702

self._verbosenote(_('uncompressed size of bundle content:\n'))

697

self._verbosenote(_('uncompressed size of bundle content:\n'))

703

size = 0

698

size = 0

704

for chunk in self.group(clnodes, cl, lookupcl, units=_('changesets')):

699

for chunk in self.group(clnodes, cl, lookupcl, units=_('changesets')):

705

size += len(chunk)

700

size += len(chunk)

706

yield chunk

701

yield chunk

707

self._verbosenote(_('%8.i (changelog)\n') % size)

702

self._verbosenote(_('%8.i (changelog)\n') % size)

708

703

709

# We need to make sure that the linkrev in the changegroup refers to

704

# We need to make sure that the linkrev in the changegroup refers to

710

# the first changeset that introduced the manifest or file revision.

705

# the first changeset that introduced the manifest or file revision.

711

# The fastpath is usually safer than the slowpath, because the filelogs

706

# The fastpath is usually safer than the slowpath, because the filelogs

712

# are walked in revlog order.

707

# are walked in revlog order.

713

#

708

#

714

# When taking the slowpath with reorder=None and the manifest revlog

709

# When taking the slowpath with reorder=None and the manifest revlog

715

# uses generaldelta, the manifest may be walked in the "wrong" order.

710

# uses generaldelta, the manifest may be walked in the "wrong" order.

716

# Without 'clrevorder', we would get an incorrect linkrev (see fix in

711

# Without 'clrevorder', we would get an incorrect linkrev (see fix in

717

# cc0ff93d0c0c).

712

# cc0ff93d0c0c).

718

#

713

#

719

# When taking the fastpath, we are only vulnerable to reordering

714

# When taking the fastpath, we are only vulnerable to reordering

720

# of the changelog itself. The changelog never uses generaldelta, so

715

# of the changelog itself. The changelog never uses generaldelta, so

721

# it is only reordered when reorder=True. To handle this case, we

716

# it is only reordered when reorder=True. To handle this case, we

722

# simply take the slowpath, which already has the 'clrevorder' logic.

717

# simply take the slowpath, which already has the 'clrevorder' logic.

723

# This was also fixed in cc0ff93d0c0c.

718

# This was also fixed in cc0ff93d0c0c.

724

fastpathlinkrev = fastpathlinkrev and not self._reorder

719

fastpathlinkrev = fastpathlinkrev and not self._reorder

725

# Treemanifests don't work correctly with fastpathlinkrev

720

# Treemanifests don't work correctly with fastpathlinkrev

726

# either, because we don't discover which directory nodes to

721

# either, because we don't discover which directory nodes to

727

# send along with files. This could probably be fixed.

722

# send along with files. This could probably be fixed.

728

fastpathlinkrev = fastpathlinkrev and (

723

fastpathlinkrev = fastpathlinkrev and (

729

'treemanifest' not in repo.requirements)

724

'treemanifest' not in repo.requirements)

730

725

731

for chunk in self.generatemanifests(commonrevs, clrevorder,

726

for chunk in self.generatemanifests(commonrevs, clrevorder,

732

fastpathlinkrev, mfs, mfchangedfiles, fnodes):

727

fastpathlinkrev, mfs, mfchangedfiles, fnodes):

733

yield chunk

728

yield chunk

734

mfs.clear()

729

mfs.clear()

735

clrevs = set(cl.rev(x) for x in clnodes)

730

clrevs = set(cl.rev(x) for x in clnodes)

736

731

737

if not fastpathlinkrev:

732

if not fastpathlinkrev:

738

def linknodes(unused, fname):

733

def linknodes(unused, fname):

739

return fnodes.get(fname, {})

734

return fnodes.get(fname, {})

740

else:

735

else:

741

cln = cl.node

736

cln = cl.node

742

def linknodes(filerevlog, fname):

737

def linknodes(filerevlog, fname):

743

llr = filerevlog.linkrev

738

llr = filerevlog.linkrev

744

fln = filerevlog.node

739

fln = filerevlog.node

745

revs = ((r, llr(r)) for r in filerevlog)

740

revs = ((r, llr(r)) for r in filerevlog)

746

return dict((fln(r), cln(lr)) for r, lr in revs if lr in clrevs)

741

return dict((fln(r), cln(lr)) for r, lr in revs if lr in clrevs)

747

742

748

changedfiles = set()

743

changedfiles = set()

749

for x in mfchangedfiles.itervalues():

744

for x in mfchangedfiles.itervalues():

750

changedfiles.update(x)

745

changedfiles.update(x)

751

for chunk in self.generatefiles(changedfiles, linknodes, commonrevs,

746

for chunk in self.generatefiles(changedfiles, linknodes, commonrevs,

752

source):

747

source):

753

yield chunk

748

yield chunk

754

749

755

yield self.close()

750

yield self.close()

756

751

757

if clnodes:

752

if clnodes:

758

repo.hook('outgoing', node=hex(clnodes[0]), source=source)

753

repo.hook('outgoing', node=hex(clnodes[0]), source=source)

759

754

760

def generatemanifests(self, commonrevs, clrevorder, fastpathlinkrev, mfs,

755

def generatemanifests(self, commonrevs, clrevorder, fastpathlinkrev, mfs,

761

mfchangedfiles, fnodes):

756

mfchangedfiles, fnodes):

762

repo = self._repo

757

repo = self._repo

763

ml = repo.manifest

758

ml = repo.manifest

764

tmfnodes = {}

759

tmfnodes = {}

765

760

766

# Callback for the manifest, used to collect linkrevs for filelog

761

# Callback for the manifest, used to collect linkrevs for filelog

767

# revisions.

762

# revisions.

768

# Returns the linkrev node (collected in lookupcl).

763

# Returns the linkrev node (collected in lookupcl).

769

if fastpathlinkrev:

764

if fastpathlinkrev:

770

lookupmflinknode = mfs.__getitem__

765

lookupmflinknode = mfs.__getitem__

771

else:

766

else:

772

def lookupmflinknode(x):

767

def lookupmflinknode(x):

773

"""Callback for looking up the linknode for manifests.

768

"""Callback for looking up the linknode for manifests.

774

769

775

Returns the linkrev node for the specified manifest.

770

Returns the linkrev node for the specified manifest.

776

771

777

SIDE EFFECT:

772

SIDE EFFECT:

778

773

779

1) fclnodes gets populated with the list of relevant

774

1) fclnodes gets populated with the list of relevant

780

file nodes if we're not using fastpathlinkrev

775

file nodes if we're not using fastpathlinkrev

781

2) When treemanifests are in use, collects treemanifest nodes

776

2) When treemanifests are in use, collects treemanifest nodes

782

to send

777

to send

783

778

784

Note that this means manifests must be completely sent to

779

Note that this means manifests must be completely sent to

785

the client before you can trust the list of files and

780

the client before you can trust the list of files and

786

treemanifests to send.

781

treemanifests to send.

787

"""

782

"""

788

clnode = mfs[x]

783

clnode = mfs[x]

789

# We no longer actually care about reading deltas of

784

# We no longer actually care about reading deltas of

790

# the manifest here, because we already know the list

785

# the manifest here, because we already know the list

791

# of changed files, so for treemanifests (which

786

# of changed files, so for treemanifests (which

792

# lazily-load anyway to *generate* a readdelta) we can

787

# lazily-load anyway to *generate* a readdelta) we can

793

# just load them with read() and then we'll actually

788

# just load them with read() and then we'll actually

794

# be able to correctly load node IDs from the

789

# be able to correctly load node IDs from the

795

# submanifest entries.

790

# submanifest entries.

796

if 'treemanifest' in repo.requirements:

791

if 'treemanifest' in repo.requirements:

797

mdata = ml.read(x)

792

mdata = ml.read(x)

798

else:

793

else:

799

mdata = ml.readfast(x)

794

mdata = ml.readfast(x)

800

for f in mfchangedfiles[x]:

795

for f in mfchangedfiles[x]:

801

try:

796

try:

802

n = mdata[f]

797

n = mdata[f]

803

except KeyError:

798

except KeyError:

804

continue

799

continue

805

# record the first changeset introducing this filelog

800

# record the first changeset introducing this filelog

806

# version

801

# version

807

fclnodes = fnodes.setdefault(f, {})

802

fclnodes = fnodes.setdefault(f, {})

808

fclnode = fclnodes.setdefault(n, clnode)

803

fclnode = fclnodes.setdefault(n, clnode)

809

if clrevorder[clnode] < clrevorder[fclnode]:

804

if clrevorder[clnode] < clrevorder[fclnode]:

810

fclnodes[n] = clnode

805

fclnodes[n] = clnode

811

# gather list of changed treemanifest nodes

806

# gather list of changed treemanifest nodes

812

if 'treemanifest' in repo.requirements:

807

if 'treemanifest' in repo.requirements:

813

submfs = {'/': mdata}

808

submfs = {'/': mdata}

814

for dn, bn in _moddirs(mfchangedfiles[x]):

809

for dn, bn in _moddirs(mfchangedfiles[x]):

815

try:

810

try:

816

submf = submfs[dn]

811

submf = submfs[dn]

817

submf = submf._dirs[bn]

812

submf = submf._dirs[bn]

818

except KeyError:

813

except KeyError:

819

continue # deleted directory, so nothing to send

814

continue # deleted directory, so nothing to send

820

submfs[submf.dir()] = submf

815

submfs[submf.dir()] = submf

821

tmfclnodes = tmfnodes.setdefault(submf.dir(), {})

816

tmfclnodes = tmfnodes.setdefault(submf.dir(), {})

822

tmfclnode = tmfclnodes.setdefault(submf._node, clnode)

817

tmfclnode = tmfclnodes.setdefault(submf._node, clnode)

823

if clrevorder[clnode] < clrevorder[tmfclnode]:

818

if clrevorder[clnode] < clrevorder[tmfclnode]:

824

tmfclnodes[n] = clnode

819

tmfclnodes[n] = clnode

825

return clnode

820

return clnode

826

821

827

mfnodes = self.prune(ml, mfs, commonrevs)

822

mfnodes = self.prune(ml, mfs, commonrevs)

828

for x in self._packmanifests(

823

size = 0

829

~~mfnodes~~, tmfnodes, lookupmflinknode):

824

for x in self._packmanifests('', mfnodes, lookupmflinknode):

825

size += len(x)

830

yield x

826

yield x

827

self._verbosenote(_('%8.i (manifests)\n') % size)

828

for dir, nodes in tmfnodes.iteritems():

829

for x in self._packmanifests(dir, nodes, nodes.get):

830

yield x

831

yield self._manifestsdone()

831

832

# The 'source' parameter is useful for extensions

833

# The 'source' parameter is useful for extensions

833

def generatefiles(self, changedfiles, linknodes, commonrevs, source):

834

def generatefiles(self, changedfiles, linknodes, commonrevs, source):

834

repo = self._repo

835

repo = self._repo

835

progress = self._progress

836

progress = self._progress

836

msgbundling = _('bundling')

837

msgbundling = _('bundling')

837

838

total = len(changedfiles)

839

total = len(changedfiles)

839

# for progress output

840

# for progress output

840

msgfiles = _('files')

841

msgfiles = _('files')

841

for i, fname in enumerate(sorted(changedfiles)):

842

for i, fname in enumerate(sorted(changedfiles)):

842

filerevlog = repo.file(fname)

843

filerevlog = repo.file(fname)

843

if not filerevlog:

844

if not filerevlog:

844

raise error.Abort(_("empty or missing revlog for %s") % fname)

845

raise error.Abort(_("empty or missing revlog for %s") % fname)

845

846

linkrevnodes = linknodes(filerevlog, fname)

847

linkrevnodes = linknodes(filerevlog, fname)

847

# Lookup for filenodes, we collected the linkrev nodes above in the

848

# Lookup for filenodes, we collected the linkrev nodes above in the

848

# fastpath case and with lookupmf in the slowpath case.

849

# fastpath case and with lookupmf in the slowpath case.

849

def lookupfilelog(x):

850

def lookupfilelog(x):

850

return linkrevnodes[x]

851

return linkrevnodes[x]

851

852

filenodes = self.prune(filerevlog, linkrevnodes, commonrevs)

853

filenodes = self.prune(filerevlog, linkrevnodes, commonrevs)

853

if filenodes:

854

if filenodes:

854

progress(msgbundling, i + 1, item=fname, unit=msgfiles,

855

progress(msgbundling, i + 1, item=fname, unit=msgfiles,

855

total=total)

856

total=total)

856

h = self.fileheader(fname)

857

h = self.fileheader(fname)

857

size = len(h)

858

size = len(h)

858

yield h

859

yield h

859

for chunk in self.group(filenodes, filerevlog, lookupfilelog):

860

for chunk in self.group(filenodes, filerevlog, lookupfilelog):

860

size += len(chunk)

861

size += len(chunk)

861

yield chunk

862

yield chunk

862

self._verbosenote(_('%8.i %s\n') % (size, fname))

863

self._verbosenote(_('%8.i %s\n') % (size, fname))

863

progress(msgbundling, None)

864

progress(msgbundling, None)

864

865

def deltaparent(self, revlog, rev, p1, p2, prev):

866

def deltaparent(self, revlog, rev, p1, p2, prev):

866

return prev

867

return prev

867

868

def revchunk(self, revlog, rev, prev, linknode):

869

def revchunk(self, revlog, rev, prev, linknode):

869

node = revlog.node(rev)

870

node = revlog.node(rev)

870

p1, p2 = revlog.parentrevs(rev)

871

p1, p2 = revlog.parentrevs(rev)

871

base = self.deltaparent(revlog, rev, p1, p2, prev)

872

base = self.deltaparent(revlog, rev, p1, p2, prev)

872

873

prefix = ''

874

prefix = ''

874

if revlog.iscensored(base) or revlog.iscensored(rev):

875

if revlog.iscensored(base) or revlog.iscensored(rev):

875

try:

876

try:

876

delta = revlog.revision(node)

877

delta = revlog.revision(node)

877

except error.CensoredNodeError as e:

878

except error.CensoredNodeError as e:

878

delta = e.tombstone

879

delta = e.tombstone

879

if base == nullrev:

880

if base == nullrev:

880

prefix = mdiff.trivialdiffheader(len(delta))

881

prefix = mdiff.trivialdiffheader(len(delta))

881

else:

882

else:

882

baselen = revlog.rawsize(base)

883

baselen = revlog.rawsize(base)

883

prefix = mdiff.replacediffheader(baselen, len(delta))

884

prefix = mdiff.replacediffheader(baselen, len(delta))

884

elif base == nullrev:

885

elif base == nullrev:

885

delta = revlog.revision(node)

886

delta = revlog.revision(node)

886

prefix = mdiff.trivialdiffheader(len(delta))

887

prefix = mdiff.trivialdiffheader(len(delta))

887

else:

888

else:

888

delta = revlog.revdiff(base, rev)

889

delta = revlog.revdiff(base, rev)

889

p1n, p2n = revlog.parents(node)

890

p1n, p2n = revlog.parents(node)

890

basenode = revlog.node(base)

891

basenode = revlog.node(base)

891

flags = revlog.flags(rev)

892

flags = revlog.flags(rev)

892

meta = self.builddeltaheader(node, p1n, p2n, basenode, linknode, flags)

893

meta = self.builddeltaheader(node, p1n, p2n, basenode, linknode, flags)

893

meta += prefix

894

meta += prefix

894

l = len(meta) + len(delta)

895

l = len(meta) + len(delta)

895

yield chunkheader(l)

896

yield chunkheader(l)

896

yield meta

897

yield meta

897

yield delta

898

yield delta

898

def builddeltaheader(self, node, p1n, p2n, basenode, linknode, flags):

899

def builddeltaheader(self, node, p1n, p2n, basenode, linknode, flags):

899

# do nothing with basenode, it is implicitly the previous one in HG10

900

# do nothing with basenode, it is implicitly the previous one in HG10

900

# do nothing with flags, it is implicitly 0 for cg1 and cg2

901

# do nothing with flags, it is implicitly 0 for cg1 and cg2

901

return struct.pack(self.deltaheader, node, p1n, p2n, linknode)

902

return struct.pack(self.deltaheader, node, p1n, p2n, linknode)

902

903

class cg2packer(cg1packer):

904

class cg2packer(cg1packer):

904

version = '02'

905

version = '02'

905

deltaheader = _CHANGEGROUPV2_DELTA_HEADER

906

deltaheader = _CHANGEGROUPV2_DELTA_HEADER

906

907

def __init__(self, repo, bundlecaps=None):

908

def __init__(self, repo, bundlecaps=None):

908

super(cg2packer, self).__init__(repo, bundlecaps)

909

super(cg2packer, self).__init__(repo, bundlecaps)

909

if self._reorder is None:

910

if self._reorder is None:

910

# Since generaldelta is directly supported by cg2, reordering

911

# Since generaldelta is directly supported by cg2, reordering

911

# generally doesn't help, so we disable it by default (treating

912

# generally doesn't help, so we disable it by default (treating

912

# bundle.reorder=auto just like bundle.reorder=False).

913

# bundle.reorder=auto just like bundle.reorder=False).

913

self._reorder = False

914

self._reorder = False

914

915

def deltaparent(self, revlog, rev, p1, p2, prev):

916

def deltaparent(self, revlog, rev, p1, p2, prev):

916

dp = revlog.deltaparent(rev)

917

dp = revlog.deltaparent(rev)

917

# avoid storing full revisions; pick prev in those cases

918

# avoid storing full revisions; pick prev in those cases

918

# also pick prev when we can't be sure remote has dp

919

# also pick prev when we can't be sure remote has dp

919

if dp == nullrev or (dp != p1 and dp != p2 and dp != prev):

920

if dp == nullrev or (dp != p1 and dp != p2 and dp != prev):

920

return prev

921

return prev

921

return dp

922

return dp

922

923

def builddeltaheader(self, node, p1n, p2n, basenode, linknode, flags):

924

def builddeltaheader(self, node, p1n, p2n, basenode, linknode, flags):

924

# Do nothing with flags, it is implicitly 0 in cg1 and cg2

925

# Do nothing with flags, it is implicitly 0 in cg1 and cg2

925

return struct.pack(self.deltaheader, node, p1n, p2n, basenode, linknode)

926

return struct.pack(self.deltaheader, node, p1n, p2n, basenode, linknode)

926

927

class cg3packer(cg2packer):

928

class cg3packer(cg2packer):

928

version = '03'

929

version = '03'

929

deltaheader = _CHANGEGROUPV3_DELTA_HEADER

930

deltaheader = _CHANGEGROUPV3_DELTA_HEADER

930

931

def _packmanifests(self, ~~mfnodes~~, tmfnodes, lookuplinknode):

932

def _packmanifests(self, dir, mfnodes, lookuplinknode):

932

# Note that debug prints are super confusing in this code, as

933

if dir:

933

# tmfnodes gets populated by the calls to lookuplinknode in

934

yield self.fileheader(dir)

934

# the superclass's manifest packer. In the future we should

935

for chunk in self.group(mfnodes, self._repo.manifest.dirlog(dir),

935

# probably see if we can refactor this somehow to be less

936

lookuplinknode, units=_('manifests')):

936

# confusing.

937

yield chunk

937

for x in super(cg3packer, self)._packmanifests(

938

mfnodes, {}, lookuplinknode):

939

def _manifestsdone(self):

939

yield x

940

return self.close()

940

dirlog = self._repo.manifest.dirlog

941

for name, nodes in tmfnodes.iteritems():

942

# For now, directory headers are simply file headers with

943

# a trailing '/' on the path (already in the name).

944

yield self.fileheader(name)

945

for chunk in self.group(nodes, dirlog(name), nodes.get):

946

yield chunk

947

yield self.close()

948

941

949

def builddeltaheader(self, node, p1n, p2n, basenode, linknode, flags):

942

def builddeltaheader(self, node, p1n, p2n, basenode, linknode, flags):

950

return struct.pack(

943

return struct.pack(

951

self.deltaheader, node, p1n, p2n, basenode, linknode, flags)

944

self.deltaheader, node, p1n, p2n, basenode, linknode, flags)

952

945

953

_packermap = {'01': (cg1packer, cg1unpacker),

946

_packermap = {'01': (cg1packer, cg1unpacker),

954

# cg2 adds support for exchanging generaldelta

947

# cg2 adds support for exchanging generaldelta

955

'02': (cg2packer, cg2unpacker),

948

'02': (cg2packer, cg2unpacker),

956

# cg3 adds support for exchanging revlog flags and treemanifests

949

# cg3 adds support for exchanging revlog flags and treemanifests

957

'03': (cg3packer, cg3unpacker),

950

'03': (cg3packer, cg3unpacker),

958

}

951

}

959

952

960

def allsupportedversions(ui):

953

def allsupportedversions(ui):

961

versions = set(_packermap.keys())

954

versions = set(_packermap.keys())

962

versions.discard('03')

955

versions.discard('03')

963

if (ui.configbool('experimental', 'changegroup3') or

956

if (ui.configbool('experimental', 'changegroup3') or

964

ui.configbool('experimental', 'treemanifest')):

957

ui.configbool('experimental', 'treemanifest')):

965

versions.add('03')

958

versions.add('03')

966

return versions

959

return versions

967

960

968

# Changegroup versions that can be applied to the repo

961

# Changegroup versions that can be applied to the repo

969

def supportedincomingversions(repo):

962

def supportedincomingversions(repo):

970

versions = allsupportedversions(repo.ui)

963

versions = allsupportedversions(repo.ui)

971

if 'treemanifest' in repo.requirements:

964

if 'treemanifest' in repo.requirements:

972

versions.add('03')

965

versions.add('03')

973

return versions

966

return versions

974

967

975

# Changegroup versions that can be created from the repo

968

# Changegroup versions that can be created from the repo

976

def supportedoutgoingversions(repo):

969

def supportedoutgoingversions(repo):

977

versions = allsupportedversions(repo.ui)

970

versions = allsupportedversions(repo.ui)

978

if 'treemanifest' in repo.requirements:

971

if 'treemanifest' in repo.requirements:

979

# Versions 01 and 02 support only flat manifests and it's just too

972

# Versions 01 and 02 support only flat manifests and it's just too

980

# expensive to convert between the flat manifest and tree manifest on

973

# expensive to convert between the flat manifest and tree manifest on

981

# the fly. Since tree manifests are hashed differently, all of history

974

# the fly. Since tree manifests are hashed differently, all of history

982

# would have to be converted. Instead, we simply don't even pretend to

975

# would have to be converted. Instead, we simply don't even pretend to

983

# support versions 01 and 02.

976

# support versions 01 and 02.

984

versions.discard('01')

977

versions.discard('01')

985

versions.discard('02')

978

versions.discard('02')

986

versions.add('03')

979

versions.add('03')

987

return versions

980

return versions

988

981

989

def safeversion(repo):

982

def safeversion(repo):

990

# Finds the smallest version that it's safe to assume clients of the repo

983

# Finds the smallest version that it's safe to assume clients of the repo

991

# will support. For example, all hg versions that support generaldelta also

984

# will support. For example, all hg versions that support generaldelta also

992

# support changegroup 02.

985

# support changegroup 02.

993

versions = supportedoutgoingversions(repo)

986

versions = supportedoutgoingversions(repo)

994

if 'generaldelta' in repo.requirements:

987

if 'generaldelta' in repo.requirements:

995

versions.discard('01')

988

versions.discard('01')

996

assert versions

989

assert versions

997

return min(versions)

990

return min(versions)

998

991

999

def getbundler(version, repo, bundlecaps=None):

992

def getbundler(version, repo, bundlecaps=None):

1000

assert version in supportedoutgoingversions(repo)

993

assert version in supportedoutgoingversions(repo)

1001

return _packermap[version][0](repo, bundlecaps)

994

return _packermap[version][0](repo, bundlecaps)

1002

995

1003

def getunbundler(version, fh, alg):

996

def getunbundler(version, fh, alg):

1004

return _packermap[version][1](fh, alg)

997

return _packermap[version][1](fh, alg)

1005

998

1006

def _changegroupinfo(repo, nodes, source):

999

def _changegroupinfo(repo, nodes, source):

1007

if repo.ui.verbose or source == 'bundle':

1000

if repo.ui.verbose or source == 'bundle':

1008

repo.ui.status(_("%d changesets found\n") % len(nodes))

1001

repo.ui.status(_("%d changesets found\n") % len(nodes))

1009

if repo.ui.debugflag:

1002

if repo.ui.debugflag:

1010

repo.ui.debug("list of changesets:\n")

1003

repo.ui.debug("list of changesets:\n")

1011

for node in nodes:

1004

for node in nodes:

1012

repo.ui.debug("%s\n" % hex(node))

1005

repo.ui.debug("%s\n" % hex(node))

1013

1006

1014

def getsubsetraw(repo, outgoing, bundler, source, fastpath=False):

1007

def getsubsetraw(repo, outgoing, bundler, source, fastpath=False):

1015

repo = repo.unfiltered()

1008

repo = repo.unfiltered()

1016

commonrevs = outgoing.common

1009

commonrevs = outgoing.common

1017

csets = outgoing.missing

1010

csets = outgoing.missing

1018

heads = outgoing.missingheads

1011

heads = outgoing.missingheads

1019

# We go through the fast path if we get told to, or if all (unfiltered

1012

# We go through the fast path if we get told to, or if all (unfiltered

1020

# heads have been requested (since we then know there all linkrevs will

1013

# heads have been requested (since we then know there all linkrevs will

1021

# be pulled by the client).

1014

# be pulled by the client).

1022

heads.sort()

1015

heads.sort()

1023

fastpathlinkrev = fastpath or (

1016

fastpathlinkrev = fastpath or (

1024

repo.filtername is None and heads == sorted(repo.heads()))

1017

repo.filtername is None and heads == sorted(repo.heads()))

1025

1018

1026

repo.hook('preoutgoing', throw=True, source=source)

1019

repo.hook('preoutgoing', throw=True, source=source)

1027

_changegroupinfo(repo, csets, source)

1020

_changegroupinfo(repo, csets, source)

1028

return bundler.generate(commonrevs, csets, fastpathlinkrev, source)

1021

return bundler.generate(commonrevs, csets, fastpathlinkrev, source)

1029

1022

1030

def getsubset(repo, outgoing, bundler, source, fastpath=False):

1023

def getsubset(repo, outgoing, bundler, source, fastpath=False):

1031

gengroup = getsubsetraw(repo, outgoing, bundler, source, fastpath)

1024

gengroup = getsubsetraw(repo, outgoing, bundler, source, fastpath)

1032

return getunbundler(bundler.version, util.chunkbuffer(gengroup), None)

1025

return getunbundler(bundler.version, util.chunkbuffer(gengroup), None)

1033

1026

1034

def changegroupsubset(repo, roots, heads, source, version='01'):

1027

def changegroupsubset(repo, roots, heads, source, version='01'):

1035

"""Compute a changegroup consisting of all the nodes that are

1028

"""Compute a changegroup consisting of all the nodes that are

1036

descendants of any of the roots and ancestors of any of the heads.

1029

descendants of any of the roots and ancestors of any of the heads.

1037

Return a chunkbuffer object whose read() method will return

1030

Return a chunkbuffer object whose read() method will return

1038

successive changegroup chunks.

1031

successive changegroup chunks.

1039

1032

1040

It is fairly complex as determining which filenodes and which

1033

It is fairly complex as determining which filenodes and which

1041

manifest nodes need to be included for the changeset to be complete

1034

manifest nodes need to be included for the changeset to be complete

1042

is non-trivial.

1035

is non-trivial.

1043

1036

1044

Another wrinkle is doing the reverse, figuring out which changeset in

1037

Another wrinkle is doing the reverse, figuring out which changeset in

1045

the changegroup a particular filenode or manifestnode belongs to.

1038

the changegroup a particular filenode or manifestnode belongs to.

1046

"""

1039

"""

1047

cl = repo.changelog

1040

cl = repo.changelog

1048

if not roots:

1041

if not roots:

1049

roots = [nullid]

1042

roots = [nullid]

1050

discbases = []

1043

discbases = []

1051

for n in roots:

1044

for n in roots:

1052

discbases.extend([p for p in cl.parents(n) if p != nullid])

1045

discbases.extend([p for p in cl.parents(n) if p != nullid])

1053

# TODO: remove call to nodesbetween.

1046

# TODO: remove call to nodesbetween.

1054

csets, roots, heads = cl.nodesbetween(roots, heads)

1047

csets, roots, heads = cl.nodesbetween(roots, heads)

1055

included = set(csets)

1048

included = set(csets)

1056

discbases = [n for n in discbases if n not in included]

1049

discbases = [n for n in discbases if n not in included]

1057

outgoing = discovery.outgoing(cl, discbases, heads)

1050

outgoing = discovery.outgoing(cl, discbases, heads)

1058

bundler = getbundler(version, repo)

1051

bundler = getbundler(version, repo)

1059

return getsubset(repo, outgoing, bundler, source)

1052

return getsubset(repo, outgoing, bundler, source)

1060

1053

1061

def getlocalchangegroupraw(repo, source, outgoing, bundlecaps=None,

1054

def getlocalchangegroupraw(repo, source, outgoing, bundlecaps=None,

1062

version='01'):

1055

version='01'):

1063

"""Like getbundle, but taking a discovery.outgoing as an argument.

1056

"""Like getbundle, but taking a discovery.outgoing as an argument.

1064

1057

1065

This is only implemented for local repos and reuses potentially

1058

This is only implemented for local repos and reuses potentially

1066

precomputed sets in outgoing. Returns a raw changegroup generator."""

1059

precomputed sets in outgoing. Returns a raw changegroup generator."""

1067

if not outgoing.missing:

1060

if not outgoing.missing:

1068

return None

1061

return None

1069

bundler = getbundler(version, repo, bundlecaps)

1062

bundler = getbundler(version, repo, bundlecaps)

1070

return getsubsetraw(repo, outgoing, bundler, source)

1063

return getsubsetraw(repo, outgoing, bundler, source)

1071

1064

1072

def getlocalchangegroup(repo, source, outgoing, bundlecaps=None,

1065

def getlocalchangegroup(repo, source, outgoing, bundlecaps=None,

1073

version='01'):

1066

version='01'):

1074

"""Like getbundle, but taking a discovery.outgoing as an argument.

1067

"""Like getbundle, but taking a discovery.outgoing as an argument.

1075

1068

1076

This is only implemented for local repos and reuses potentially

1069

This is only implemented for local repos and reuses potentially

1077

precomputed sets in outgoing."""

1070

precomputed sets in outgoing."""

1078

if not outgoing.missing:

1071

if not outgoing.missing:

1079

return None

1072

return None

1080

bundler = getbundler(version, repo, bundlecaps)

1073

bundler = getbundler(version, repo, bundlecaps)

1081

return getsubset(repo, outgoing, bundler, source)

1074

return getsubset(repo, outgoing, bundler, source)

1082

1075

1083

def computeoutgoing(repo, heads, common):

1076

def computeoutgoing(repo, heads, common):

1084

"""Computes which revs are outgoing given a set of common

1077

"""Computes which revs are outgoing given a set of common

1085

and a set of heads.

1078

and a set of heads.

1086

1079

1087

This is a separate function so extensions can have access to

1080

This is a separate function so extensions can have access to

1088

the logic.

1081

the logic.

1089

1082

1090

Returns a discovery.outgoing object.

1083

Returns a discovery.outgoing object.

1091

"""

1084

"""

1092

cl = repo.changelog

1085

cl = repo.changelog

1093

if common:

1086

if common:

1094

hasnode = cl.hasnode

1087

hasnode = cl.hasnode

1095

common = [n for n in common if hasnode(n)]

1088

common = [n for n in common if hasnode(n)]

1096

else:

1089

else:

1097

common = [nullid]

1090

common = [nullid]

1098

if not heads:

1091

if not heads:

1099

heads = cl.heads()

1092

heads = cl.heads()

1100

return discovery.outgoing(cl, common, heads)

1093

return discovery.outgoing(cl, common, heads)

1101

1094

1102

def getchangegroup(repo, source, heads=None, common=None, bundlecaps=None,

1095

def getchangegroup(repo, source, heads=None, common=None, bundlecaps=None,

1103

version='01'):

1096

version='01'):

1104

"""Like changegroupsubset, but returns the set difference between the

1097

"""Like changegroupsubset, but returns the set difference between the

1105

ancestors of heads and the ancestors common.

1098

ancestors of heads and the ancestors common.

1106

1099

1107

If heads is None, use the local heads. If common is None, use [nullid].

1100

If heads is None, use the local heads. If common is None, use [nullid].

1108

1101

1109

The nodes in common might not all be known locally due to the way the

1102

The nodes in common might not all be known locally due to the way the

1110

current discovery protocol works.

1103

current discovery protocol works.

1111

"""

1104

"""

1112

outgoing = computeoutgoing(repo, heads, common)

1105

outgoing = computeoutgoing(repo, heads, common)

1113

return getlocalchangegroup(repo, source, outgoing, bundlecaps=bundlecaps,

1106

return getlocalchangegroup(repo, source, outgoing, bundlecaps=bundlecaps,

1114

version=version)

1107

version=version)

1115

1108

1116

def changegroup(repo, basenodes, source):

1109

def changegroup(repo, basenodes, source):

1117

# to avoid a race we use changegroupsubset() (issue1320)

1110

# to avoid a race we use changegroupsubset() (issue1320)

1118

return changegroupsubset(repo, basenodes, repo.heads(), source)

1111

return changegroupsubset(repo, basenodes, repo.heads(), source)

1119

1112

1120

def _addchangegroupfiles(repo, source, revmap, trp, pr, needfiles):

1113

def _addchangegroupfiles(repo, source, revmap, trp, pr, needfiles):

1121

revisions = 0

1114

revisions = 0

1122

files = 0

1115

files = 0

1123

while True:

1116

while True:

1124

chunkdata = source.filelogheader()

1117

chunkdata = source.filelogheader()

1125

if not chunkdata:

1118

if not chunkdata:

1126

break

1119

break

1127

f = chunkdata["filename"]

1120

f = chunkdata["filename"]

1128

repo.ui.debug("adding %s revisions\n" % f)

1121

repo.ui.debug("adding %s revisions\n" % f)

1129

pr()

1122

pr()

1130

fl = repo.file(f)

1123

fl = repo.file(f)

1131

o = len(fl)

1124

o = len(fl)

1132

try:

1125

try:

1133

if not fl.addgroup(source, revmap, trp):

1126

if not fl.addgroup(source, revmap, trp):

1134

raise error.Abort(_("received file revlog group is empty"))

1127

raise error.Abort(_("received file revlog group is empty"))

1135

except error.CensoredBaseError as e:

1128

except error.CensoredBaseError as e:

1136

raise error.Abort(_("received delta base is censored: %s") % e)

1129

raise error.Abort(_("received delta base is censored: %s") % e)

1137

revisions += len(fl) - o

1130

revisions += len(fl) - o

1138

files += 1

1131

files += 1

1139

if f in needfiles:

1132

if f in needfiles:

1140

needs = needfiles[f]

1133

needs = needfiles[f]

1141

for new in xrange(o, len(fl)):

1134

for new in xrange(o, len(fl)):

1142

n = fl.node(new)

1135

n = fl.node(new)

1143

if n in needs:

1136

if n in needs:

1144

needs.remove(n)

1137

needs.remove(n)

1145

else:

1138

else:

1146

raise error.Abort(

1139

raise error.Abort(

1147

_("received spurious file revlog entry"))

1140

_("received spurious file revlog entry"))

1148

if not needs:

1141

if not needs:

1149

del needfiles[f]

1142

del needfiles[f]

1150

repo.ui.progress(_('files'), None)

1143

repo.ui.progress(_('files'), None)

1151

1144

1152

for f, needs in needfiles.iteritems():

1145

for f, needs in needfiles.iteritems():

1153

fl = repo.file(f)

1146

fl = repo.file(f)

1154

for n in needs:

1147

for n in needs:

1155

try:

1148

try:

1156

fl.rev(n)

1149

fl.rev(n)

1157

except error.LookupError:

1150

except error.LookupError:

1158

raise error.Abort(

1151

raise error.Abort(

1159

_('missing file data for %s:%s - run hg verify') %

1152

_('missing file data for %s:%s - run hg verify') %

1160

(f, hex(n)))

1153

(f, hex(n)))

1161

1154

1162

return revisions, files

1155

return revisions, files

	Site-wide shortcuts
/	Use quick search box
g h	Goto home page
g g	Goto my private gists page
g G	Goto my public gists page
g 0-9	Goto bookmarked items from 0-9
n r	New repository page
n g	New gist page

	Repositories
g s	Goto summary page
g c	Goto changelog page
g f	Goto files page
g F	Goto files page with file search activated
g p	Goto pull requests page
g o	Goto repository settings
g O	Goto repository access permissions settings
t s	Toggle sidebar on some pages

             # changegroup.py - Mercurial changegroup manipulation functions
             #
             #  Copyright 2006 Matt Mackall <mpm@selenic.com>
             #
             # This software may be used and distributed according to the terms of the
             # GNU General Public License version 2 or any later version.
             from __future__ import absolute_import
             import os
             import struct
             import tempfile
             import weakref
             from .i18n import _
             from .node import (
                 hex,
                 nullid,
                 nullrev,
                 short,
             )
             from . import (
                 branchmap,
                 dagutil,
                 discovery,
                 error,
                 mdiff,
                 phases,
                 util,
             )
             _CHANGEGROUPV1_DELTA_HEADER = "20s20s20s20s"
             _CHANGEGROUPV2_DELTA_HEADER = "20s20s20s20s20s"
             _CHANGEGROUPV3_DELTA_HEADER = ">20s20s20s20s20sH"
             def readexactly(stream, n):
                 """Read exactly ``n`` bytes from ``stream``.

                 ``stream.read(n)`` is called once. If it hands back fewer than
                 ``n`` bytes an error.Abort is raised, otherwise the data is
                 returned unchanged.
                 """
                 data = stream.read(n)
                 got = len(data)
                 if got >= n:
                     return data
                 raise error.Abort(_("stream ended unexpectedly"
                                     " (got %d bytes, expected %d)")
                                   % (got, n))
             def getchunk(stream):
                 """Return the payload of the next chunk in ``stream`` as a string.

                 A chunk starts with a 4-byte big-endian signed length that counts
                 the length field itself. A length of 0 yields the empty string;
                 any other length of 4 or less aborts; otherwise the remaining
                 ``length - 4`` bytes are read and returned.
                 """
                 header = readexactly(stream, 4)
                 (length,) = struct.unpack(">l", header)
                 if length > 4:
                     return readexactly(stream, length - 4)
                 if length != 0:
                     raise error.Abort(_("invalid chunk length %d") % length)
                 return ""
             def chunkheader(length):
                 """Return the 4-byte header for a chunk carrying ``length`` bytes.

                 The encoded value is ``length + 4`` because the length field
                 counts its own four bytes.
                 """
                 framed = length + 4
                 return struct.pack(">l", framed)
             def closechunk():
                 """Return the header of a zero-length chunk (four zero bytes)."""
                 terminator = 0
                 return struct.pack(">l", terminator)
             def combineresults(results):
                 """Combine 0 or more addchangegroup results into one.

                 Each result is an integer: 0, 1, ``1 + n`` for n added heads, or
                 ``-1 - n`` for n removed heads.

                 Returns:
                 - 0 as soon as any individual result is 0
                 - ``1 + n`` when the results add up to n more heads
                 - ``-1 - n`` when the results add up to n fewer heads
                 - 1 otherwise (including for an empty ``results``)
                 """
                 changedheads = 0
                 for ret in results:
                     # A 0 result wins outright. Returning here (rather than
                     # breaking out of the loop) keeps head changes accumulated
                     # from earlier results from overwriting the 0.
                     if ret == 0:
                         return 0
                     if ret < -1:
                         changedheads += ret + 1
                     elif ret > 1:
                         changedheads += ret - 1
                 if changedheads > 0:
                     return 1 + changedheads
                 if changedheads < 0:
                     return -1 + changedheads
                 return 1
             # Maps a bundle type name to a (header, compression) pair.
             # writebundle() unpacks the pair, writes the header first and looks
             # the compression name up in util.compressors.
             bundletypes = {
                 "": ("", None),       # only when using unbundle on ssh and old http servers
                                       # since the unification ssh accepts a header but there
                                       # is no capability signaling it.
                 "HG20": (), # special-cased below
                 "HG10UN": ("HG10UN", None),
                 # NOTE(review): the header here is "HG10", not "HG10BZ" --
                 # presumably the compressed stream itself supplies the "BZ"
                 # bytes; confirm against util.compressors.
                 "HG10BZ": ("HG10", 'BZ'),
                 "HG10GZ": ("HG10GZ", 'GZ'),
             }
             # hgweb uses this list to communicate its preferred type
             bundlepriority = ['HG10GZ', 'HG10BZ', 'HG10UN']
             def writechunks(ui, chunks, filename, vfs=None):
                 """Write every item of ``chunks`` to a file and return its name.

                 When ``filename`` is empty a temporary file (prefix
                 "hg-bundle-", suffix ".hg") is created. Otherwise the file is
                 opened in "wb" mode, through ``vfs.open`` when ``vfs`` is given
                 and the builtin ``open`` when it is not. If writing fails the
                 file is unlinked before the exception propagates. ``ui`` is not
                 used here.

                 NOTE(review): the earlier docstring said existing files are not
                 overwritten, but the target is opened with "wb" -- confirm.
                 """
                 out = None
                 pending = None  # path to remove if we fail part-way through
                 try:
                     if not filename:
                         fd, filename = tempfile.mkstemp(prefix="hg-bundle-", suffix=".hg")
                         out = os.fdopen(fd, "wb")
                     elif vfs:
                         out = vfs.open(filename, "wb")
                     else:
                         out = open(filename, "wb")
                     pending = filename
                     for piece in chunks:
                         out.write(piece)
                     # everything was written: nothing to clean up any more
                     pending = None
                     return filename
                 finally:
                     if out is not None:
                         out.close()
                     if pending is not None:
                         remove = vfs.unlink if (filename and vfs) else os.unlink
                         remove(pending)
             def writebundle(ui, cg, filename, bundletype, vfs=None, compression=None):
                 """Write the changegroup ``cg`` as a bundle file and return its name.

                 For ``bundletype == "HG20"`` the changegroup is wrapped in a
                 bundle2 'changegroup' part and ``compression`` is handed to the
                 bundle. For every other type ``compression`` must be None, ``cg``
                 must be a version '01' changegroup, and the output is the
                 header from ``bundletypes`` followed by the compressed chunks.

                 The actual writing is delegated to writechunks(), which also
                 decides the file name when ``filename`` is empty.
                 """
                 if bundletype != "HG20":
                     # the compression argument is only meaningful for bundle2
                     assert compression is None
                     if cg.version != '01':
                         raise error.Abort(_('old bundle types only supports v1 '
                                             'changegroups'))
                     header, comp = bundletypes[bundletype]
                     if comp not in util.compressors:
                         raise error.Abort(_('unknown stream compression type: %s')
                                           % comp)
                     compressor = util.compressors[comp]()
                     rawchunks = cg.getchunks()
                     def compressedchunks():
                         # header goes out uncompressed, then the payload
                         yield header
                         for chunk in rawchunks:
                             yield compressor.compress(chunk)
                         yield compressor.flush()
                     stream = compressedchunks()
                 else:
                     from . import bundle2
                     bundle = bundle2.bundle20(ui)
                     bundle.setcompression(compression)
                     part = bundle.newpart('changegroup', data=cg.getchunks())
                     part.addparam('version', cg.version)
                     stream = bundle.getchunks()
                 return writechunks(ui, stream, filename, vfs=vfs)
             class cg1unpacker(object):
                 """Unpacker for cg1 changegroup streams.
                 A changegroup unpacker handles the framing of the revision data in
                 the wire format. Most consumers will want to use the apply()
                 method to add the changes from the changegroup to a repository.
                 If you're forwarding a changegroup unmodified to another consumer,
                 use getchunks(), which returns an iterator of changegroup
                 chunks. This is mostly useful for cases where you need to know the
                 data stream has ended by observing the end of the changegroup.
                 deltachunk() is useful only if you're applying delta data. Most
                 consumers should prefer apply() instead.
                 A few other public methods exist. Those are used only for
                 bundlerepo and some debug commands - their use is discouraged.
                 """
                 deltaheader = _CHANGEGROUPV1_DELTA_HEADER
                 deltaheadersize = struct.calcsize(deltaheader)
                 version = '01'
                 _grouplistcount = 1 # One list of files after the manifests
                 def __init__(self, fh, alg):
                     """Wrap ``fh`` in the decompressor selected by ``alg``.

                     'UN' is treated as None and 'BZ' is remapped to
                     '_truncatedBZ' before the lookup in util.decompressors. An
                     ``alg`` that is not a key of util.decompressors aborts.
                     """
                     # get more modern without breaking too much
                     if alg == 'UN':
                         alg = None
                     if alg not in util.decompressors:
                         raise error.Abort(_('unknown stream compression type: %s')
                                          % alg)
                     if alg == 'BZ':
                         alg = '_truncatedBZ'
                     decompressor = util.decompressors[alg]
                     self._stream = decompressor(fh)
                     self._type = alg
                     # optional hook; _chunklength() calls it when it is set
                     self.callback = None
                 # These methods (compressed, read, seek, tell) all appear to only
                 # be used by bundlerepo, but it's a little hard to tell.
                 def compressed(self):
                     """Return True when a compression type is recorded for the stream.

                     ``self._type`` is the (possibly remapped) ``alg`` stored by
                     ``__init__``; 'UN' is stored as None.
                     """
                     return self._type is not None
                 def read(self, l):
                     """Return the result of ``self._stream.read(l)``."""
                     return self._stream.read(l)
                 def seek(self, pos):
                     """Return the result of ``self._stream.seek(pos)``."""
                     return self._stream.seek(pos)
                 def tell(self):
                     """Return the result of ``self._stream.tell()``."""
                     return self._stream.tell()
                 def close(self):
                     """Close the underlying stream via ``self._stream.close()``."""
                     return self._stream.close()
                 def _chunklength(self):
                     """Read a chunk header and return the payload length.

                     Returns 0 for a zero-length (closing) chunk and aborts on
                     any other encoded length of 4 or less. For a real chunk
                     ``self.callback`` is invoked first when it is set.
                     """
                     raw = readexactly(self._stream, 4)
                     (length,) = struct.unpack(">l", raw)
                     if length > 4:
                         if self.callback:
                             self.callback()
                         # the encoded length includes the 4 header bytes
                         return length - 4
                     if length:
                         raise error.Abort(_("invalid chunk length %d") % length)
                     return 0
                 def changelogheader(self):
                     """Return the changelog header, which is always an empty dict.

                     v10 does not have a changelog header chunk, so nothing is
                     read from the stream.
                     """
                     return {}
                 def manifestheader(self):
                     """Return the manifest header, which is always an empty dict.

                     v10 does not have a manifest header chunk, so nothing is
                     read from the stream.
                     """
                     return {}
                 def filelogheader(self):
                     """Return the header of the next filelog group.

                     v10 only carries the file name, returned as
                     ``{'filename': name}``. An empty dict is returned when the
                     next chunk is zero-length.
                     """
                     size = self._chunklength()
                     if size:
                         return {'filename': readexactly(self._stream, size)}
                     return {}
                 def _deltaheader(self, headertuple, prevnode):
                     node, p1, p2, cs = headertuple
                     if prevnode is None:
                         deltabase = p1
                     else:
                         deltabase = prevnode
                     flags = 0
                     return node, p1, p2, deltabase, cs, flags
                 def deltachunk(self, prevnode):
                     """Read the next delta chunk and return it as a dict.

                     Returns an empty dict for a zero-length chunk. Otherwise the
                     dict has the keys 'node', 'p1', 'p2', 'cs', 'deltabase',
                     'delta' and 'flags'. ``prevnode`` is forwarded to
                     ``_deltaheader`` to pick the delta base.
                     """
                     size = self._chunklength()
                     if not size:
                         return {}
                     headersize = self.deltaheadersize
                     rawheader = readexactly(self._stream, headersize)
                     fields = struct.unpack(self.deltaheader, rawheader)
                     # whatever follows the fixed-size header is the delta itself
                     delta = readexactly(self._stream, size - headersize)
                     node, p1, p2, deltabase, cs, flags = self._deltaheader(fields,
                                                                            prevnode)
                     return {'node': node, 'p1': p1, 'p2': p2, 'cs': cs,
                             'deltabase': deltabase, 'delta': delta, 'flags': flags}
                 def getchunks(self):
                     """Yield every chunk contained in the bundle.

                     Used when the binary stream has to be forwarded to a file or
                     to another network API. The changegroup data is parsed so
                     that the end of the stream is known; otherwise reading
                     would block in the sshrepo case.

                     Payloads are yielded in slices of at most 2**20 bytes, each
                     group is terminated with a closing chunk.
                     """
                     # an empty chunkgroup is the end of the changegroup
                     # a changegroup has at least 2 chunkgroups (changelog and manifest).
                     # after that, changegroup versions 1 and 2 have a series of groups
                     # with one group per file. changegroup 3 has a series of directory
                     # manifests before the files.
                     slicesize = 2**20
                     groupsseen = 0
                     emptygroups = 0
                     while emptygroups < self._grouplistcount:
                         groupisempty = True
                         groupsseen += 1
                         chunk = getchunk(self)
                         while chunk:
                             groupisempty = False
                             yield chunkheader(len(chunk))
                             start = 0
                             while start < len(chunk):
                                 yield chunk[start:start + slicesize]
                                 start += slicesize
                             chunk = getchunk(self)
                         # only groups after the first two count as terminators
                         if groupisempty and groupsseen > 2:
                             emptygroups += 1
                         yield closechunk()
                 def _unpackmanifests(self, repo, revmap, trp, prog, numchanges):
                     """Add the manifest group from this stream to ``repo.manifest``.

                     ``prog(_('manifests'), numchanges)`` is stored as
                     ``self.callback``, which ``_chunklength`` calls for each
                     non-empty chunk it reads. ``revmap`` and ``trp`` are passed
                     straight through to ``repo.manifest.addgroup``.
                     """
                     # We know that we'll never have more manifests than we had
                     # changesets.
                     self.callback = prog(_('manifests'), numchanges)
                     # no need to check for empty manifest group here:
                     # if the result of the merge of 1 and 2 is the same in 3 and 4,
                     # no new manifest will be created and the manifest group will
                     # be empty during the pull
                     self.manifestheader()
                     repo.manifest.addgroup(self, revmap, trp)
                     # presumably a None position ends the 'manifests' progress
                     # topic -- confirm against ui.progress
                     repo.ui.progress(_('manifests'), None)
                 def apply(self, repo, srctype, url, emptyok=False,
                           targetphase=phases.draft, expectedtotal=None):
                     """Add the changegroup returned by source.read() to this repo.
                     srctype is a string like 'push', 'pull', or 'unbundle'.  url is
                     the URL of the repo where this changegroup is coming from.
                     emptyok suppresses the abort raised when the changelog group
                     adds nothing. targetphase is the phase boundary applied to the
                     added changesets, except for srctype 'push'/'serve' (where it is
                     ignored) and 'strip' (where boundaries are left untouched).
                     expectedtotal is passed as the total of the changeset progress
                     reporter.
                     Return an integer summarizing the change to this repo:
                     - nothing changed or no source: 0
                     - more heads than before: 1+added heads (2..n)
                     - fewer heads than before: -1-removed heads (-2..-n)
                     - number of heads stays the same: 1
                     Raises error.Abort if the changelog group is empty and emptyok
                     is false.
                     """
                     repo = repo.unfiltered()
                     # Both helpers below close over ``cl``, which is only bound once
                     # the transaction has been opened further down.
                     def csmap(x):
                         # Passed to cl.addgroup(); logs the incoming node and returns
                         # the current changelog length.
                         repo.ui.debug("add changeset %s\n" % short(x))
                         return len(cl)
                     def revmap(x):
                         # Map a changeset node to its changelog revision number.
                         return cl.rev(x)
                     changesets = files = revisions = 0
                     try:
                         with repo.transaction("\n".join([srctype,
                                                          util.hidepassword(url)])) as tr:
                             # The transaction could have been created before and already
                             # carries source information. In this case we use the top
                             # level data. We overwrite the argument because we need to use
                             # the top level value (if they exist) in this function.
                             srctype = tr.hookargs.setdefault('source', srctype)
                             url = tr.hookargs.setdefault('url', url)
                             repo.hook('prechangegroup', throw=True, **tr.hookargs)
                             # write changelog data to temp files so concurrent readers
                             # will not see an inconsistent view
                             cl = repo.changelog
                             cl.delayupdate(tr)
                             oldheads = cl.heads()
                             # weak proxy so the revlogs do not hold a strong reference
                             # to the transaction
                             trp = weakref.proxy(tr)
                             # pull off the changeset group
                             repo.ui.status(_("adding changesets\n"))
                             clstart = len(cl)
                             class prog(object):
                                 # Callable progress reporter: every call reports the
                                 # current count for ``step`` and then increments it.
                                 def __init__(self, step, total):
                                     self._step = step
                                     self._total = total
                                     self._count = 1
                                 def __call__(self):
                                     repo.ui.progress(self._step, self._count,
                                                      unit=_('chunks'), total=self._total)
                                     self._count += 1
                             self.callback = prog(_('changesets'), expectedtotal)
                             # names of the files touched by the incoming changesets,
                             # collected as each changeset is added
                             efiles = set()
                             def onchangelog(cl, node):
                                 efiles.update(cl.read(node)[3])
                             self.changelogheader()
                             srccontent = cl.addgroup(self, csmap, trp,
                                                      addrevisioncb=onchangelog)
                             # from here on only the number of touched files is needed
                             # (it becomes the total of the 'files' progress below)
                             efiles = len(efiles)
                             if not (srccontent or emptyok):
                                 raise error.Abort(_("received changelog group is empty"))
                             clend = len(cl)
                             changesets = clend - clstart
                             repo.ui.progress(_('changesets'), None)
                             # pull off the manifest group
                             repo.ui.status(_("adding manifests\n"))
                             self._unpackmanifests(repo, revmap, trp, prog, changesets)
                             # file name -> set of file nodes that must show up in the
                             # file groups; only filled when server.validate is set
                             needfiles = {}
                             if repo.ui.configbool('server', 'validate', default=False):
                                 # validate incoming csets have their manifests
                                 for cset in xrange(clstart, clend):
                                     mfnode = repo.changelog.read(
                                         repo.changelog.node(cset))[0]
                                     mfest = repo.manifest.readdelta(mfnode)
                                     # store file nodes we must see
                                     for f, n in mfest.iteritems():
                                         needfiles.setdefault(f, set()).add(n)
                             # process the files
                             repo.ui.status(_("adding file changes\n"))
                             self.callback = None
                             pr = prog(_('files'), efiles)
                             newrevs, newfiles = _addchangegroupfiles(
                                 repo, self, revmap, trp, pr, needfiles)
                             revisions += newrevs
                             files += newfiles
                             # dh is the change in head count; a new head that closes
                             # its branch is not counted as an added head
                             dh = 0
                             if oldheads:
                                 heads = cl.heads()
                                 dh = len(heads) - len(oldheads)
                                 for h in heads:
                                     if h not in oldheads and repo[h].closesbranch():
                                         dh -= 1
                             htext = ""
                             if dh:
                                 htext = _(" (%+d heads)") % dh
                             repo.ui.status(_("added %d changesets"
                                              " with %d changes to %d files%s\n")
                                              % (changesets, revisions, files, htext))
                             repo.invalidatevolatilesets()
                             if changesets > 0:
                                 # If the transaction does not carry a 'node' yet, the
                                 # node range is recorded on the transaction itself;
                                 # otherwise the transaction's values are left alone and
                                 # only the local copy handed to the hooks is updated.
                                 if 'node' not in tr.hookargs:
                                     tr.hookargs['node'] = hex(cl.node(clstart))
                                     tr.hookargs['node_last'] = hex(cl.node(clend - 1))
                                     hookargs = dict(tr.hookargs)
                                 else:
                                     hookargs = dict(tr.hookargs)
                                     hookargs['node'] = hex(cl.node(clstart))
                                     hookargs['node_last'] = hex(cl.node(clend - 1))
                                 repo.hook('pretxnchangegroup', throw=True, **hookargs)
                             # nodes of every changeset added by this changegroup
                             added = [cl.node(r) for r in xrange(clstart, clend)]
                             publishing = repo.publishing()
                             if srctype in ('push', 'serve'):
                                 # Old servers can not push the boundary themselves.
                                 # New servers won't push the boundary if changeset already
                                 # exists locally as secret
                                 #
                                 # We should not use added here but the list of all change in
                                 # the bundle
                                 if publishing:
                                     phases.advanceboundary(repo, tr, phases.public,
                                                            srccontent)
                                 else:
                                     # Those changesets have been pushed from the
                                     # outside, their phases are going to be pushed
                                     # alongside. Therefore `targetphase` is
                                     # ignored.
                                     phases.advanceboundary(repo, tr, phases.draft,
                                                            srccontent)
                                     phases.retractboundary(repo, tr, phases.draft, added)
                             elif srctype != 'strip':
                                 # publishing only alter behavior during push
                                 #
                                 # strip should not touch boundary at all
                                 phases.retractboundary(repo, tr, targetphase, added)
                             if changesets > 0:
                                 if srctype != 'strip':
                                     # During strip, branchcache is invalid but
                                     # coming call to `destroyed` will repair it.
                                     # In other case we can safely update cache on
                                     # disk.
                                     branchmap.updatecache(repo.filtered('served'))
                                 def runhooks():
                                     # These hooks run when the lock releases, not when the
                                     # transaction closes. So it's possible for the changelog
                                     # to have changed since we last saw it.
                                     if clstart >= len(repo):
                                         return
                                     # forcefully update the on-disk branch cache
                                     # NOTE(review): only a debug message is emitted here;
                                     # no cache update call is visible in this function.
                                     repo.ui.debug("updating the branch cache\n")
                                     repo.hook("changegroup", **hookargs)
                                     # 'incoming' fires once per added changeset, with
                                     # 'node' set to that changeset and no 'node_last'
                                     for n in added:
                                         args = hookargs.copy()
                                         args['node'] = hex(n)
                                         del args['node_last']
                                         repo.hook("incoming", **args)
                                     newheads = [h for h in repo.heads()
                                                 if h not in oldheads]
                                     # new heads are logged by the hex of their first
                                     # six bytes
                                     repo.ui.log("incoming",
                                                 "%s incoming changes - new heads: %s\n",
                                                 len(added),
                                                 ', '.join([hex(c[:6]) for c in newheads]))
                                 # Register runhooks as a post-close callback under a
                                 # name derived from clstart; when it fires it defers
                                 # the hooks through repo._afterlock().
                                 tr.addpostclose('changegroup-runhooks-%020i' % clstart,
                                                 lambda tr: repo._afterlock(runhooks))
                     finally:
                         repo.ui.flush()
                     # never return 0 here:
                     # the head delta is shifted away from zero so that the result
                     # follows the scheme described in the docstring
                     if dh < 0:
                         return dh - 1
                     else:
                         return dh + 1
             class cg2unpacker(cg1unpacker):
                 """Unpacker for version '02' changegroup streams.
                 The cg2 delta header carries an explicit delta base node (needed
                 for generaldelta), which makes it one field longer than the cg1
                 header. Everything else is inherited from cg1unpacker.
                 """
                 deltaheader = _CHANGEGROUPV2_DELTA_HEADER
                 deltaheadersize = struct.calcsize(deltaheader)
                 version = '02'
                 def _deltaheader(self, headertuple, prevnode):
                     """Expand a parsed five-field cg2 header into the six-field form.
                     prevnode is unused because the delta base is part of the header.
                     """
                     node, p1, p2, deltabase, cs = headertuple
                     # cg2 has no flags field on the wire; the flags slot is always 0
                     return node, p1, p2, deltabase, cs, 0
             class cg3unpacker(cg2unpacker):
                 """Unpacker for version '03' changegroup streams.
                 Compared to cg2, the delta header gains a revlog flags field and
                 the stream may carry directory manifest groups (treemanifests)
                 after the root manifest group, terminated by an empty chunk
                 before the file groups start.
                 """
                 deltaheader = _CHANGEGROUPV3_DELTA_HEADER
                 deltaheadersize = struct.calcsize(deltaheader)
                 version = '03'
                 _grouplistcount = 2 # One list of manifests and one list of files
                 def _deltaheader(self, headertuple, prevnode):
                     """Return the six header fields; cg3 already includes the flags."""
                     node, p1, p2, deltabase, cs, flags = headertuple
                     return node, p1, p2, deltabase, cs, flags
                 def _unpackmanifests(self, repo, revmap, trp, prog, numchanges):
                     """Read the root manifest group, then every directory manifest group.
                     Raises error.Abort if a directory group adds nothing to its revlog.
                     """
                     super(cg3unpacker, self)._unpackmanifests(repo, revmap, trp, prog,
                                                               numchanges)
                     # Each non-empty header announces one directory manifest group;
                     # a false header marks the end of the list.
                     header = self.filelogheader()
                     while header:
                         dirname = header["filename"]
                         repo.ui.debug("adding %s revisions\n" % dirname)
                         if not repo.manifest.dirlog(dirname).addgroup(self, revmap, trp):
                             raise error.Abort(_("received dir revlog group is empty"))
                         header = self.filelogheader()
             class headerlessfixup(object):
                 """Readable wrapper that replays header bytes before a stream.
                 fh is the underlying stream and h the bytes that were already
                 consumed from it; read() serves h first and then continues with
                 exact reads from fh.
                 """
                 def __init__(self, fh, h):
                     self._h = h
                     self._fh = fh
                 def read(self, n):
                     """Return exactly n bytes, taking them from the saved header first."""
                     pending = self._h
                     if not pending:
                         # header fully replayed: read straight from the stream
                         return readexactly(self._fh, n)
                     head = pending[:n]
                     self._h = pending[n:]
                     missing = n - len(head)
                     if missing > 0:
                         # the header ran out mid-request; top up from the stream
                         head += readexactly(self._fh, missing)
                     return head
             def _moddirs(files):
                 """Given a set of modified files, find the list of modified directories.
                 This returns a list of (path to changed dir, changed dir) tuples,
                 as that's what the one client needs anyway.
                 >>> _moddirs(['a/b/c.py', 'a/b/c.txt', 'a/d/e/f/g.txt', 'i.txt', ])
                 [('/', 'a/'), ('a/', 'b/'), ('a/', 'd/'), ('a/d/', 'e/'), ('a/d/e/', 'f/')]
                 """
                 alldirs = set()
                 for f in files:
                     path = f.split('/')[:-1]
                     for i in xrange(len(path) - 1, -1, -1):
                         dn = '/'.join(path[:i])
                         current = dn + '/', path[i] + '/'
                         if current in alldirs:
                             break
                         alldirs.add(current)
                 return sorted(alldirs)
             class cg1packer(object):
                 deltaheader = _CHANGEGROUPV1_DELTA_HEADER
                 version = '01'
                 def __init__(self, repo, bundlecaps=None):
                     """Given a source repo, construct a bundler.
                     bundlecaps is optional and can be used to specify the set of
                     capabilities which can be used to build the bundle.
                     """
                     # Set of capabilities we can use to build the bundle.
                     if bundlecaps is None:
                         bundlecaps = set()
                     self._bundlecaps = bundlecaps
                     # experimental config: bundle.reorder
                     reorder = repo.ui.config('bundle', 'reorder', 'auto')
                     if reorder == 'auto':
                         reorder = None
                     else:
                         reorder = util.parsebool(reorder)
                     self._repo = repo
                     self._reorder = reorder
                     self._progress = repo.ui.progress
                     if self._repo.ui.verbose and not self._repo.ui.debugflag:
                         self._verbosenote = self._repo.ui.note
                     else:
                         self._verbosenote = lambda s: None
                 def close(self):
                     return closechunk()
                 def fileheader(self, fname):
                     return chunkheader(len(fname)) + fname
                 def group(self, nodelist, revlog, lookup, units=None):
                     """Calculate a delta group, yielding a sequence of changegroup chunks
                     (strings).
                     Given a list of changeset revs, return a set of deltas and
                     metadata corresponding to nodes. The first delta is
                     first parent(nodelist[0]) -> nodelist[0], the receiver is
                     guaranteed to have this parent as it has all history before
                     these changesets. In the case firstparent is nullrev the
                     changegroup starts with a full revision.
                     If units is not None, progress detail will be generated, units specifies
                     the type of revlog that is touched (changelog, manifest, etc.).
                     """
                     # if we don't have any revisions touched by these changesets, bail
                     if len(nodelist) == 0:
                         yield self.close()
                         return
                     # for generaldelta revlogs, we linearize the revs; this will both be
                     # much quicker and generate a much smaller bundle
                     if (revlog._generaldelta and self._reorder is None) or self._reorder:
                         dag = dagutil.revlogdag(revlog)
                         revs = set(revlog.rev(n) for n in nodelist)
                         revs = dag.linearize(revs)
                     else:
                         revs = sorted([revlog.rev(n) for n in nodelist])
                     # add the parent of the first rev
                     p = revlog.parentrevs(revs[0])[0]
                     revs.insert(0, p)
                     # build deltas
                     total = len(revs) - 1
                     msgbundling = _('bundling')
                     for r in xrange(len(revs) - 1):
                         if units is not None:
                             self._progress(msgbundling, r + 1, unit=units, total=total)
                         prev, curr = revs[r], revs[r + 1]
                         linknode = lookup(revlog.node(curr))
                         for c in self.revchunk(revlog, curr, prev, linknode):
                             yield c
                     if units is not None:
                         self._progress(msgbundling, None)
                     yield self.close()
                 # filter any nodes that claim to be part of the known set
                 def prune(self, revlog, missing, commonrevs):
                     rr, rl = revlog.rev, revlog.linkrev
                     return [n for n in missing if rl(rr(n)) not in commonrevs]
-                def _packmanifests(self, mfnodes, tmfnodes, lookuplinknode):
+                def _packmanifests(self, dir, mfnodes, lookuplinknode):
                     """Pack flat manifests into a changegroup stream."""
-                    ml = self._repo.manifest
+                    assert not dir
-                    size = 0
+                    for chunk in self.group(mfnodes, self._repo.manifest,
-                    for chunk in self.group(
+                                            lookuplinknode, units=_('manifests')):
-                            mfnodes, ml, lookuplinknode, units=_('manifests')):
-                        size += len(chunk)
                         yield chunk
-                    self._verbosenote(_('%8.i (manifests)\n') % size)
-                    # It looks odd to assert this here, but tmfnodes doesn't get
+                def _manifestsdone(self):
-                    # filled in until after we've called lookuplinknode for
+                    return ''
-                    # sending root manifests, so the only way to tell the streams
-                    # got crossed is to check after we've done all the work.
-                    assert not tmfnodes
                 def generate(self, commonrevs, clnodes, fastpathlinkrev, source):
                     '''yield a sequence of changegroup chunks (strings)'''
                     repo = self._repo
                     cl = repo.changelog
                     clrevorder = {}
                     mfs = {} # needed manifests
                     fnodes = {} # needed file nodes
                     # maps manifest node id -> set(changed files)
                     mfchangedfiles = {}
                     # Callback for the changelog, used to collect changed files and manifest
                     # nodes.
                     # Returns the linkrev node (identity in the changelog case).
                     def lookupcl(x):
                         c = cl.read(x)
                         clrevorder[x] = len(clrevorder)
                         n = c[0]
                         # record the first changeset introducing this manifest version
                         mfs.setdefault(n, x)
                         # Record a complete list of potentially-changed files in
                         # this manifest.
                         mfchangedfiles.setdefault(n, set()).update(c[3])
                         return x
                     self._verbosenote(_('uncompressed size of bundle content:\n'))
                     size = 0
                     for chunk in self.group(clnodes, cl, lookupcl, units=_('changesets')):
                         size += len(chunk)
                         yield chunk
                     self._verbosenote(_('%8.i (changelog)\n') % size)
                     # We need to make sure that the linkrev in the changegroup refers to
                     # the first changeset that introduced the manifest or file revision.
                     # The fastpath is usually safer than the slowpath, because the filelogs
                     # are walked in revlog order.
                     #
                     # When taking the slowpath with reorder=None and the manifest revlog
                     # uses generaldelta, the manifest may be walked in the "wrong" order.
                     # Without 'clrevorder', we would get an incorrect linkrev (see fix in
                     # cc0ff93d0c0c).
                     #
                     # When taking the fastpath, we are only vulnerable to reordering
                     # of the changelog itself. The changelog never uses generaldelta, so
                     # it is only reordered when reorder=True. To handle this case, we
                     # simply take the slowpath, which already has the 'clrevorder' logic.
                     # This was also fixed in cc0ff93d0c0c.
                     fastpathlinkrev = fastpathlinkrev and not self._reorder
                     # Treemanifests don't work correctly with fastpathlinkrev
                     # either, because we don't discover which directory nodes to
                     # send along with files. This could probably be fixed.
                     fastpathlinkrev = fastpathlinkrev and (
                         'treemanifest' not in repo.requirements)
                     for chunk in self.generatemanifests(commonrevs, clrevorder,
                             fastpathlinkrev, mfs, mfchangedfiles, fnodes):
                         yield chunk
                     mfs.clear()
                     clrevs = set(cl.rev(x) for x in clnodes)
                     if not fastpathlinkrev:
                         def linknodes(unused, fname):
                             return fnodes.get(fname, {})
                     else:
                         cln = cl.node
                         def linknodes(filerevlog, fname):
                             llr = filerevlog.linkrev
                             fln = filerevlog.node
                             revs = ((r, llr(r)) for r in filerevlog)
                             return dict((fln(r), cln(lr)) for r, lr in revs if lr in clrevs)
                     changedfiles = set()
                     for x in mfchangedfiles.itervalues():
                         changedfiles.update(x)
                     for chunk in self.generatefiles(changedfiles, linknodes, commonrevs,
                                                     source):
                         yield chunk
                     yield self.close()
                     if clnodes:
                         repo.hook('outgoing', node=hex(clnodes[0]), source=source)
                 def generatemanifests(self, commonrevs, clrevorder, fastpathlinkrev, mfs,
                                       mfchangedfiles, fnodes):
                     repo = self._repo
                     ml = repo.manifest
                     tmfnodes = {}
                     # Callback for the manifest, used to collect linkrevs for filelog
                     # revisions.
                     # Returns the linkrev node (collected in lookupcl).
                     if fastpathlinkrev:
                         lookupmflinknode = mfs.__getitem__
                     else:
                         def lookupmflinknode(x):
                             """Callback for looking up the linknode for manifests.
                             Returns the linkrev node for the specified manifest.
                             SIDE EFFECT:
 ) fclnodes gets populated with the list of relevant
                                file nodes if we're not using fastpathlinkrev
 ) When treemanifests are in use, collects treemanifest nodes
                                to send
                             Note that this means manifests must be completely sent to
                             the client before you can trust the list of files and
                             treemanifests to send.
                             """
                             clnode = mfs[x]
                             # We no longer actually care about reading deltas of
                             # the manifest here, because we already know the list
                             # of changed files, so for treemanifests (which
                             # lazily-load anyway to *generate* a readdelta) we can
                             # just load them with read() and then we'll actually
                             # be able to correctly load node IDs from the
                             # submanifest entries.
                             if 'treemanifest' in repo.requirements:
                                 mdata = ml.read(x)
                             else:
                                 mdata = ml.readfast(x)
                             for f in mfchangedfiles[x]:
                                 try:
                                     n = mdata[f]
                                 except KeyError:
                                     continue
                                 # record the first changeset introducing this filelog
                                 # version
                                 fclnodes = fnodes.setdefault(f, {})
                                 fclnode = fclnodes.setdefault(n, clnode)
                                 if clrevorder[clnode] < clrevorder[fclnode]:
                                     fclnodes[n] = clnode
                             # gather list of changed treemanifest nodes
                             if 'treemanifest' in repo.requirements:
                                 submfs = {'/': mdata}
                                 for dn, bn in _moddirs(mfchangedfiles[x]):
                                     try:
                                         submf = submfs[dn]
                                         submf = submf._dirs[bn]
                                     except KeyError:
                                         continue # deleted directory, so nothing to send
                                     submfs[submf.dir()] = submf
                                     tmfclnodes = tmfnodes.setdefault(submf.dir(), {})
                                     tmfclnode = tmfclnodes.setdefault(submf._node, clnode)
                                     if clrevorder[clnode] < clrevorder[tmfclnode]:
                                         tmfclnodes[n] = clnode
                             return clnode
                     mfnodes = self.prune(ml, mfs, commonrevs)
-                    for x in self._packmanifests(
+                    size = 0
-                        mfnodes, tmfnodes, lookupmflinknode):
+                    for x in self._packmanifests('', mfnodes, lookupmflinknode):
+                        size += len(x)
                         yield x
+                    self._verbosenote(_('%8.i (manifests)\n') % size)
+                    for dir, nodes in tmfnodes.iteritems():
+                        for x in self._packmanifests(dir, nodes, nodes.get):
+                            yield x
+                    yield self._manifestsdone()
                 # The 'source' parameter is useful for extensions
                 def generatefiles(self, changedfiles, linknodes, commonrevs, source):
                     repo = self._repo
                     progress = self._progress
                     msgbundling = _('bundling')
                     total = len(changedfiles)
                     # for progress output
                     msgfiles = _('files')
                     for i, fname in enumerate(sorted(changedfiles)):
                         filerevlog = repo.file(fname)
                         if not filerevlog:
                             raise error.Abort(_("empty or missing revlog for %s") % fname)
                         linkrevnodes = linknodes(filerevlog, fname)
                         # Lookup for filenodes, we collected the linkrev nodes above in the
                         # fastpath case and with lookupmf in the slowpath case.
                         def lookupfilelog(x):
                             return linkrevnodes[x]
                         filenodes = self.prune(filerevlog, linkrevnodes, commonrevs)
                         if filenodes:
                             progress(msgbundling, i + 1, item=fname, unit=msgfiles,
                                      total=total)
                             h = self.fileheader(fname)
                             size = len(h)
                             yield h
                             for chunk in self.group(filenodes, filerevlog, lookupfilelog):
                                 size += len(chunk)
                                 yield chunk
                             self._verbosenote(_('%8.i  %s\n') % (size, fname))
                     progress(msgbundling, None)
                 def deltaparent(self, revlog, rev, p1, p2, prev):
                     return prev
                 def revchunk(self, revlog, rev, prev, linknode):
                     """Generate the changegroup chunk for revision ``rev`` of ``revlog``.

                     Three pieces are yielded, in order: the chunk header carrying the
                     combined length, the delta header (with any diff prefix appended),
                     and the delta payload.  ``prev`` is handed to ``deltaparent`` to
                     choose the delta base; ``linknode`` is passed through to
                     ``builddeltaheader``.
                     """
                     node = revlog.node(rev)
                     p1, p2 = revlog.parentrevs(rev)
                     base = self.deltaparent(revlog, rev, p1, p2, prev)
                     if revlog.iscensored(base) or revlog.iscensored(rev):
                         # Censored base or target: take the text from
                         # revlog.revision() (or the tombstone carried by the
                         # exception) instead of asking for a revdiff.
                         try:
                             payload = revlog.revision(node)
                         except error.CensoredNodeError as e:
                             payload = e.tombstone
                         if base != nullrev:
                             diffheader = mdiff.replacediffheader(revlog.rawsize(base),
                                                                  len(payload))
                         else:
                             diffheader = mdiff.trivialdiffheader(len(payload))
                     elif base != nullrev:
                         # regular case: revdiff output is sent without extra prefix
                         payload = revlog.revdiff(base, rev)
                         diffheader = ''
                     else:
                         # null base: send the revision behind a trivial diff header
                         payload = revlog.revision(node)
                         diffheader = mdiff.trivialdiffheader(len(payload))
                     p1n, p2n = revlog.parents(node)
                     basenode = revlog.node(base)
                     flags = revlog.flags(rev)
                     header = self.builddeltaheader(node, p1n, p2n, basenode, linknode,
                                                    flags)
                     header += diffheader
                     # the announced length covers the header and the payload
                     yield chunkheader(len(header) + len(payload))
                     yield header
                     yield payload
                 def builddeltaheader(self, node, p1n, p2n, basenode, linknode, flags):
                     """Pack the delta header for one revision using ``self.deltaheader``.

                     Only ``node``, ``p1n``, ``p2n`` and ``linknode`` are written, in
                     that order.
                     """
                     # basenode is left out: it is implicitly the previous one in HG10
                     # flags is left out: it is implicitly 0 for cg1 and cg2
                     packed = (node, p1n, p2n, linknode)
                     return struct.pack(self.deltaheader, *packed)
             class cg2packer(cg1packer):
                 """Packer for changegroup version '02'.

                 Compared with cg1packer, the delta base is chosen per revision and
                 is written into the delta header.
                 """
                 version = '02'
                 deltaheader = _CHANGEGROUPV2_DELTA_HEADER
                 def __init__(self, repo, bundlecaps=None):
                     """Initialise like cg1packer, then default ``_reorder`` to False."""
                     super(cg2packer, self).__init__(repo, bundlecaps)
                     # Since generaldelta is directly supported by cg2, reordering
                     # generally doesn't help, so we disable it by default (treating
                     # bundle.reorder=auto just like bundle.reorder=False).
                     if self._reorder is None:
                         self._reorder = False
                 def deltaparent(self, revlog, rev, p1, p2, prev):
                     """Return the revision to send ``rev`` as a delta against.

                     The revlog's own delta parent is used when it is one of ``p1``,
                     ``p2`` or ``prev``; in every other case ``prev`` is returned.
                     """
                     storedbase = revlog.deltaparent(rev)
                     # Keep the stored base only if it is a real revision (so we avoid
                     # sending a full revision) and one we can be sure the remote has.
                     if storedbase != nullrev and storedbase in (p1, p2, prev):
                         return storedbase
                     return prev
                 def builddeltaheader(self, node, p1n, p2n, basenode, linknode, flags):
                     """Pack node, parents, delta base and linknode; flags is dropped."""
                     # Do nothing with flags, it is implicitly 0 in cg1 and cg2
                     packed = (node, p1n, p2n, basenode, linknode)
                     return struct.pack(self.deltaheader, *packed)
             class cg3packer(cg2packer):
                 """Packer for changegroup version '03'.

                 On top of cg2packer it writes revlog flags into the delta header and
                 emits manifests per directory through ``_packmanifests``.
                 """
                 version = '03'
                 deltaheader = _CHANGEGROUPV3_DELTA_HEADER
                 def _packmanifests(self, dir, mfnodes, lookuplinknode):
                     """Yield the chunks for the manifest nodes ``mfnodes`` of ``dir``.

                     When ``dir`` is non-empty, a file header naming it is yielded
                     first.  The remaining chunks come from ``self.group`` run over
                     ``self._repo.manifest.dirlog(dir)`` with ``lookuplinknode`` as
                     the link node lookup.
                     """
                     if dir:
                         # a directory section is introduced by a regular file header
                         yield self.fileheader(dir)
                     for chunk in self.group(mfnodes, self._repo.manifest.dirlog(dir),
                                             lookuplinknode, units=_('manifests')):
                         yield chunk
                 def _manifestsdone(self):
                     """Return the result of ``self.close()`` to end the manifests."""
                     return self.close()
                 def builddeltaheader(self, node, p1n, p2n, basenode, linknode, flags):
                     """Pack node, parents, delta base, linknode and flags."""
                     return struct.pack(
                         self.deltaheader, node, p1n, p2n, basenode, linknode, flags)
             # Maps a changegroup version string to its (packer, unpacker) classes.
             _packermap = {
                 '01': (cg1packer, cg1unpacker),
                 # cg2 adds support for exchanging generaldelta
                 '02': (cg2packer, cg2unpacker),
                 # cg3 adds support for exchanging revlog flags and treemanifests
                 '03': (cg3packer, cg3unpacker),
             }
             def allsupportedversions(ui):
                 """Return the set of changegroup versions enabled by ``ui``.

                 Every key of ``_packermap`` is included, except that '03' is present
                 exactly when ``experimental.changegroup3`` or
                 ``experimental.treemanifest`` is set.
                 """
                 enabled = set(_packermap)
                 cg3requested = (ui.configbool('experimental', 'changegroup3') or
                                 ui.configbool('experimental', 'treemanifest'))
                 if cg3requested:
                     enabled.add('03')
                 else:
                     enabled.discard('03')
                 return enabled
             def supportedincomingversions(repo):
                 """Return the changegroup versions that can be applied to the repo.

                 This is ``allsupportedversions(repo.ui)``, with '03' always included
                 when the repo has the 'treemanifest' requirement.
                 """
                 incoming = allsupportedversions(repo.ui)
                 if 'treemanifest' not in repo.requirements:
                     return incoming
                 incoming.add('03')
                 return incoming
             def supportedoutgoingversions(repo):
                 """Return the changegroup versions that can be created from the repo.

                 This is ``allsupportedversions(repo.ui)``; for a repo with the
                 'treemanifest' requirement, '01' and '02' are removed and '03' is
                 added.
                 """
                 outgoing = allsupportedversions(repo.ui)
                 if 'treemanifest' not in repo.requirements:
                     return outgoing
                 # Versions 01 and 02 support only flat manifests and it's just too
                 # expensive to convert between the flat manifest and tree manifest on
                 # the fly. Since tree manifests are hashed differently, all of history
                 # would have to be converted. Instead, we simply don't even pretend to
                 # support versions 01 and 02.
                 outgoing.difference_update(('01', '02'))
                 outgoing.add('03')
                 return outgoing
             def safeversion(repo):
                 """Return the smallest changegroup version safe to assume for clients.

                 The candidates are ``supportedoutgoingversions(repo)``; '01' is
                 dropped when the repo requires 'generaldelta', because all hg
                 versions that support generaldelta also support changegroup 02.
                 """
                 candidates = supportedoutgoingversions(repo)
                 if 'generaldelta' in repo.requirements:
                     candidates.difference_update(['01'])
                 # at least one version must remain to choose from
                 assert candidates
                 return min(candidates)
             def getbundler(version, repo, bundlecaps=None):
                 """Instantiate the packer registered in ``_packermap`` for ``version``.

                 ``version`` is asserted to be one of
                 ``supportedoutgoingversions(repo)``.
                 """
                 assert version in supportedoutgoingversions(repo)
                 packercls = _packermap[version][0]
                 return packercls(repo, bundlecaps)
             def getunbundler(version, fh, alg):
                 """Instantiate the unpacker registered for ``version`` with (fh, alg)."""
                 unpackercls = _packermap[version][1]
                 return unpackercls(fh, alg)
             def _changegroupinfo(repo, nodes, source):
                 if repo.ui.verbose or source == 'bundle':
                     repo.ui.status(_("%d changesets found\n") % len(nodes))
                 if repo.ui.debugflag:
                     repo.ui.debug("list of changesets:\n")
                     for node in nodes:
                         repo.ui.debug("%s\n" % hex(node))
             def getsubsetraw(repo, outgoing, bundler, source, fastpath=False):
                 """Return what ``bundler.generate`` produces for ``outgoing``.

                 The unfiltered view of ``repo`` is used.  The 'preoutgoing' hook is
                 run with ``throw=True`` and ``_changegroupinfo`` reports the
                 changesets before generation starts.

                 ``outgoing`` supplies ``common``, ``missing`` and ``missingheads``.
                 ``fastpath`` forces the linkrev fast path; it is also taken when the
                 missing heads equal the heads of the repo.
                 """
                 repo = repo.unfiltered()
                 commonrevs = outgoing.common
                 csets = outgoing.missing
                 heads = outgoing.missingheads
                 # We go through the fast path if we get told to, or if all
                 # (unfiltered) heads have been requested (since we then know that
                 # all linkrevs will be pulled by the client).
                 #
                 # Sorted copies are compared: outgoing.missingheads belongs to the
                 # caller and must not be reordered in place.
                 fastpathlinkrev = fastpath or (
                         repo.filtername is None and
                         sorted(heads) == sorted(repo.heads()))
                 repo.hook('preoutgoing', throw=True, source=source)
                 _changegroupinfo(repo, csets, source)
                 return bundler.generate(commonrevs, csets, fastpathlinkrev, source)
             def getsubset(repo, outgoing, bundler, source, fastpath=False):
                 """Like getsubsetraw, but return an unbundler over the generated data.

                 The raw output is wrapped in ``util.chunkbuffer`` and handed to the
                 unbundler matching ``bundler.version``, with ``None`` as ``alg``.
                 """
                 rawchunks = getsubsetraw(repo, outgoing, bundler, source, fastpath)
                 version = bundler.version
                 return getunbundler(version, util.chunkbuffer(rawchunks), None)
             def changegroupsubset(repo, roots, heads, source, version='01'):
                 """Compute a changegroup consisting of all the nodes that are
                 descendants of any of the roots and ancestors of any of the heads.

                 Return a chunkbuffer object whose read() method will return
                 successive changegroup chunks.

                 It is fairly complex as determining which filenodes and which
                 manifest nodes need to be included for the changeset to be complete
                 is non-trivial.

                 Another wrinkle is doing the reverse, figuring out which changeset in
                 the changegroup a particular filenode or manifestnode belongs to.

                 An empty ``roots`` is treated as ``[nullid]``.
                 """
                 cl = repo.changelog
                 roots = roots or [nullid]
                 # candidate discovery bases: the non-null parents of every root
                 discbases = [parent
                              for root in roots
                              for parent in cl.parents(root)
                              if parent != nullid]
                 # TODO: remove call to nodesbetween.
                 csets, roots, heads = cl.nodesbetween(roots, heads)
                 # a base that is itself part of the outgoing set is not a base
                 included = set(csets)
                 discbases = [base for base in discbases if base not in included]
                 outgoing = discovery.outgoing(cl, discbases, heads)
                 return getsubset(repo, outgoing, getbundler(version, repo), source)
             def getlocalchangegroupraw(repo, source, outgoing, bundlecaps=None,
                                        version='01'):
                 """Like getbundle, but taking a discovery.outgoing as an argument.

                 This is only implemented for local repos and reuses potentially
                 precomputed sets in outgoing. Returns a raw changegroup generator,
                 or None when ``outgoing.missing`` is empty."""
                 if outgoing.missing:
                     packer = getbundler(version, repo, bundlecaps)
                     return getsubsetraw(repo, outgoing, packer, source)
                 return None
             def getlocalchangegroup(repo, source, outgoing, bundlecaps=None,
                                     version='01'):
                 """Like getbundle, but taking a discovery.outgoing as an argument.

                 This is only implemented for local repos and reuses potentially
                 precomputed sets in outgoing. Returns None when
                 ``outgoing.missing`` is empty."""
                 if outgoing.missing:
                     packer = getbundler(version, repo, bundlecaps)
                     return getsubset(repo, outgoing, packer, source)
                 return None
             def computeoutgoing(repo, heads, common):
                 """Computes which revs are outgoing given a set of common
                 and a set of heads.

                 This is a separate function so extensions can have access to
                 the logic.

                 Nodes in ``common`` that the changelog does not have are dropped; an
                 empty ``common`` becomes ``[nullid]`` and empty ``heads`` become the
                 changelog heads.

                 Returns a discovery.outgoing object.
                 """
                 cl = repo.changelog
                 if not common:
                     common = [nullid]
                 else:
                     hasnode = cl.hasnode
                     common = [node for node in common if hasnode(node)]
                 heads = heads or cl.heads()
                 return discovery.outgoing(cl, common, heads)
             def getchangegroup(repo, source, heads=None, common=None, bundlecaps=None,
                                version='01'):
                 """Like changegroupsubset, but returns the set difference between the
                 ancestors of heads and the ancestors common.

                 If heads is None, use the local heads. If common is None, use [nullid].

                 The nodes in common might not all be known locally due to the way the
                 current discovery protocol works.
                 """
                 return getlocalchangegroup(repo, source,
                                            computeoutgoing(repo, heads, common),
                                            bundlecaps=bundlecaps,
                                            version=version)
             def changegroup(repo, basenodes, source):
                 """Return changegroupsubset() from ``basenodes`` up to the repo heads."""
                 # to avoid a race we use changegroupsubset() (issue1320)
                 currentheads = repo.heads()
                 return changegroupsubset(repo, basenodes, currentheads, source)
             def _addchangegroupfiles(repo, source, revmap, trp, pr, needfiles):
                 """Add the file revlog groups read from ``source`` to ``repo``.

                 File headers are read from ``source`` until an empty one is found.
                 For each header, ``pr()`` is called and the following group is added
                 to that file's log via ``addgroup(source, revmap, trp)``.

                 ``needfiles`` maps a file name to the collection of file nodes still
                 expected for it.  It is updated in place: received nodes are
                 removed, and a file's entry is deleted once nothing is left.

                 Returns a ``(revisions, files)`` tuple: the number of file revisions
                 added and the number of file groups processed.

                 Raises error.Abort when a group is empty, when a delta base is
                 censored, when a file listed in ``needfiles`` receives a revision
                 that was not expected, or when an expected node is still unknown to
                 its file log after all groups were processed.
                 """
                 revisions = files = 0
                 while True:
                     chunkdata = source.filelogheader()
                     if not chunkdata:
                         break
                     fname = chunkdata["filename"]
                     repo.ui.debug("adding %s revisions\n" % fname)
                     pr()
                     flog = repo.file(fname)
                     oldlen = len(flog)
                     try:
                         added = flog.addgroup(source, revmap, trp)
                         if not added:
                             raise error.Abort(_("received file revlog group is empty"))
                     except error.CensoredBaseError as e:
                         raise error.Abort(_("received delta base is censored: %s") % e)
                     revisions += len(flog) - oldlen
                     files += 1
                     if fname not in needfiles:
                         continue
                     # every revision just added must be one we were waiting for
                     expected = needfiles[fname]
                     for newrev in xrange(oldlen, len(flog)):
                         filenode = flog.node(newrev)
                         if filenode not in expected:
                             raise error.Abort(
                                 _("received spurious file revlog entry"))
                         expected.remove(filenode)
                     if not expected:
                         del needfiles[fname]
                 repo.ui.progress(_('files'), None)
                 # whatever is still listed must already be known to its file log
                 for fname, expected in needfiles.iteritems():
                     flog = repo.file(fname)
                     for filenode in expected:
                         try:
                             flog.rev(filenode)
                         except error.LookupError:
                             raise error.Abort(
                                 _('missing file data for %s:%s - run hg verify') %
                                 (fname, hex(filenode)))
                 return revisions, files