stream: double check that self.vfs is *not* in the vfsmap...
marmoute
r48353:65c51966 stable
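
This changeset adds a second line of defense in `_emit2()` and `consumev2()`: beyond the existing `assert` in `_makemap()`, each function now explicitly verifies that `repo.vfs` is absent from the vfs map and raises `error.ProgrammingError` otherwise. Unlike the plain `assert`, the explicit raise still fires when Python runs with `-O`. The added guard, excerpted from the diff below:

    if repo.vfs in vfsmap.values():
        raise error.ProgrammingError(
            b'repo.vfs must not be added to vfsmap for security reasons'
        )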
@@ -1,750 +1,769 @@
# streamclone.py - producing and consuming streaming repository data
#
# Copyright 2015 Gregory Szorc <gregory.szorc@gmail.com>
#
# This software may be used and distributed according to the terms of the
# GNU General Public License version 2 or any later version.

from __future__ import absolute_import

import contextlib
import os
import struct

from .i18n import _
from .pycompat import open
from .interfaces import repository
from . import (
    cacheutil,
    error,
    narrowspec,
    phases,
    pycompat,
    requirements as requirementsmod,
    scmutil,
    store,
    util,
)


def canperformstreamclone(pullop, bundle2=False):
    """Whether it is possible to perform a streaming clone as part of pull.

    ``bundle2`` will cause the function to consider stream clone through
    bundle2 and only through bundle2.

    Returns a tuple of (supported, requirements). ``supported`` is True if
    streaming clone is supported and False otherwise. ``requirements`` is
    a set of repo requirements from the remote, or ``None`` if stream clone
    isn't supported.
    """
    repo = pullop.repo
    remote = pullop.remote

    bundle2supported = False
    if pullop.canusebundle2:
        if b'v2' in pullop.remotebundle2caps.get(b'stream', []):
            bundle2supported = True
        # else
        # Server doesn't support bundle2 stream clone or doesn't support
        # the versions we support. Fall back and possibly allow legacy.

    # Ensures legacy code path uses available bundle2.
    if bundle2supported and not bundle2:
        return False, None
    # Ensures bundle2 doesn't try to do a stream clone if it isn't supported.
    elif bundle2 and not bundle2supported:
        return False, None

    # Streaming clone only works on empty repositories.
    if len(repo):
        return False, None

    # Streaming clone only works if all data is being requested.
    if pullop.heads:
        return False, None

    streamrequested = pullop.streamclonerequested

    # If we don't have a preference, let the server decide for us. This
    # likely only comes into play in LANs.
    if streamrequested is None:
        # The server can advertise whether to prefer streaming clone.
        streamrequested = remote.capable(b'stream-preferred')

    if not streamrequested:
        return False, None

    # In order for stream clone to work, the client has to support all the
    # requirements advertised by the server.
    #
    # The server advertises its requirements via the "stream" and "streamreqs"
    # capability. "stream" (a value-less capability) is advertised if and only
    # if the only requirement is "revlogv1." Else, the "streamreqs" capability
    # is advertised and contains a comma-delimited list of requirements.
    requirements = set()
    if remote.capable(b'stream'):
        requirements.add(requirementsmod.REVLOGV1_REQUIREMENT)
    else:
        streamreqs = remote.capable(b'streamreqs')
        # This is weird and shouldn't happen with modern servers.
        if not streamreqs:
            pullop.repo.ui.warn(
                _(
                    b'warning: stream clone requested but server has them '
                    b'disabled\n'
                )
            )
            return False, None

        streamreqs = set(streamreqs.split(b','))
        # Server requires something we don't support. Bail.
        missingreqs = streamreqs - repo.supportedformats
        if missingreqs:
            pullop.repo.ui.warn(
                _(
                    b'warning: stream clone requested but client is missing '
                    b'requirements: %s\n'
                )
                % b', '.join(sorted(missingreqs))
            )
            pullop.repo.ui.warn(
                _(
                    b'(see https://www.mercurial-scm.org/wiki/MissingRequirement '
                    b'for more information)\n'
                )
            )
            return False, None
        requirements = streamreqs

    return True, requirements

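# Editor's sketch (not part of this commit): the capability decoding
# described in the comment block above, over made-up capability values.
# A value-less b'stream' capability implies exactly revlogv1; otherwise
# b'streamreqs' carries the comma-delimited requirement list.
# `remote_requirements` is a hypothetical helper, not a Mercurial API.
def remote_requirements(caps):
    if b'stream' in caps:
        return {b'revlogv1'}
    return set(caps[b'streamreqs'].split(b','))

assert remote_requirements({b'stream': None}) == {b'revlogv1'}
assert remote_requirements({b'streamreqs': b'revlogv1,generaldelta'}) == {
    b'revlogv1',
    b'generaldelta',
}
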
def maybeperformlegacystreamclone(pullop):
    """Possibly perform a legacy stream clone operation.

    Legacy stream clones are performed as part of pull but before all other
    operations.

    A legacy stream clone will not be performed if a bundle2 stream clone is
    supported.
    """
    from . import localrepo

    supported, requirements = canperformstreamclone(pullop)

    if not supported:
        return

    repo = pullop.repo
    remote = pullop.remote

    # Save remote branchmap. We will use it later to speed up branchcache
    # creation.
    rbranchmap = None
    if remote.capable(b'branchmap'):
        with remote.commandexecutor() as e:
            rbranchmap = e.callcommand(b'branchmap', {}).result()

    repo.ui.status(_(b'streaming all changes\n'))

    with remote.commandexecutor() as e:
        fp = e.callcommand(b'stream_out', {}).result()

    # TODO strictly speaking, this code should all be inside the context
    # manager because the context manager is supposed to ensure all wire state
    # is flushed when exiting. But the legacy peers don't do this, so it
    # doesn't matter.
    l = fp.readline()
    try:
        resp = int(l)
    except ValueError:
        raise error.ResponseError(
            _(b'unexpected response from remote server:'), l
        )
    if resp == 1:
        raise error.Abort(_(b'operation forbidden by server'))
    elif resp == 2:
        raise error.Abort(_(b'locking the remote repository failed'))
    elif resp != 0:
        raise error.Abort(_(b'the server sent an unknown error code'))

    l = fp.readline()
    try:
        filecount, bytecount = map(int, l.split(b' ', 1))
    except (ValueError, TypeError):
        raise error.ResponseError(
            _(b'unexpected response from remote server:'), l
        )

    with repo.lock():
        consumev1(repo, fp, filecount, bytecount)

        # new requirements = old non-format requirements +
        #                    new format-related remote requirements
        # requirements from the streamed-in repository
        repo.requirements = requirements | (
            repo.requirements - repo.supportedformats
        )
        repo.svfs.options = localrepo.resolvestorevfsoptions(
            repo.ui, repo.requirements, repo.features
        )
        scmutil.writereporequirements(repo)

        if rbranchmap:
            repo._branchcaches.replace(repo, rbranchmap)

        repo.invalidate()


def allowservergeneration(repo):
    """Whether streaming clones are allowed from the server."""
    if repository.REPO_FEATURE_STREAM_CLONE not in repo.features:
        return False

    if not repo.ui.configbool(b'server', b'uncompressed', untrusted=True):
        return False

    # The way stream clone works makes it impossible to hide secret changesets.
    # So don't allow this by default.
    secret = phases.hassecret(repo)
    if secret:
        return repo.ui.configbool(b'server', b'uncompressedallowsecret')

    return True


# This is its own function so extensions can override it.
def _walkstreamfiles(repo, matcher=None):
    return repo.store.walk(matcher)


def generatev1(repo):
    """Emit content for version 1 of a streaming clone.

    This returns a 3-tuple of (file count, byte size, data iterator).

    The data iterator consists of N entries for each file being transferred.
    Each file entry starts as a line with the file name and integer size
    delimited by a null byte.

    The raw file data follows. Following the raw file data is the next file
    entry, or EOF.

    When used on the wire protocol, an additional line indicating protocol
    success will be prepended to the stream. This function is not responsible
    for adding it.

    This function will obtain a repository lock to ensure a consistent view of
    the store is captured. It therefore may raise LockError.
    """
    entries = []
    total_bytes = 0
    # Get consistent snapshot of repo, lock during scan.
    with repo.lock():
        repo.ui.debug(b'scanning\n')
        for file_type, name, ename, size in _walkstreamfiles(repo):
            if size:
                entries.append((name, size))
                total_bytes += size
        _test_sync_point_walk_1(repo)
    _test_sync_point_walk_2(repo)

    repo.ui.debug(
        b'%d files, %d bytes to transfer\n' % (len(entries), total_bytes)
    )

    svfs = repo.svfs
    debugflag = repo.ui.debugflag

    def emitrevlogdata():
        for name, size in entries:
            if debugflag:
                repo.ui.debug(b'sending %s (%d bytes)\n' % (name, size))
            # partially encode name over the wire for backwards compat
            yield b'%s\0%d\n' % (store.encodedir(name), size)
            # auditing at this stage is both pointless (paths are already
            # trusted by the local repo) and expensive
            with svfs(name, b'rb', auditpath=False) as fp:
                if size <= 65536:
                    yield fp.read(size)
                else:
                    for chunk in util.filechunkiter(fp, limit=size):
                        yield chunk

    return len(entries), total_bytes, emitrevlogdata()

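# Editor's sketch (not part of this commit): decoding one generatev1() file
# entry from an in-memory stream, following the "name\0size\n" framing the
# docstring above describes. io.BytesIO stands in for the wire.
import io

stream = io.BytesIO(b'data/foo.i\x005\nhello')
header = stream.readline()        # b'data/foo.i\x005\n'
name, size = header[:-1].split(b'\0', 1)
payload = stream.read(int(size))  # exactly `size` bytes of raw file data
assert (name, payload) == (b'data/foo.i', b'hello')
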
def generatev1wireproto(repo):
    """Emit content for version 1 of streaming clone suitable for the wire.

    This is the data output from ``generatev1()`` with 2 header lines. The
    first line indicates overall success. The 2nd contains the file count and
    byte size of payload.

    The success line contains "0" for success, "1" for stream generation not
    allowed, and "2" for error locking the repository (possibly indicating
    a permissions error for the server process).
    """
    if not allowservergeneration(repo):
        yield b'1\n'
        return

    try:
        filecount, bytecount, it = generatev1(repo)
    except error.LockError:
        yield b'2\n'
        return

    # Indicates successful response.
    yield b'0\n'
    yield b'%d %d\n' % (filecount, bytecount)
    for chunk in it:
        yield chunk


def generatebundlev1(repo, compression=b'UN'):
    """Emit content for version 1 of a stream clone bundle.

    The first 4 bytes of the output ("HGS1") denote this as stream clone
    bundle version 1.

    The next 2 bytes indicate the compression type. Only "UN" is currently
    supported.

    The next 16 bytes are two 64-bit big endian unsigned integers indicating
    file count and byte count, respectively.

    The next 2 bytes is a 16-bit big endian unsigned short declaring the length
    of the requirements string, including a trailing \0. The following N bytes
    are the requirements string, which is ASCII containing a comma-delimited
    list of repo requirements that are needed to support the data.

    The remaining content is the output of ``generatev1()`` (which may be
    compressed in the future).

    Returns a tuple of (requirements, data generator).
    """
    if compression != b'UN':
        raise ValueError(b'we do not support the compression argument yet')

    requirements = repo.requirements & repo.supportedformats
    requires = b','.join(sorted(requirements))

    def gen():
        yield b'HGS1'
        yield compression

        filecount, bytecount, it = generatev1(repo)
        repo.ui.status(
            _(b'writing %d bytes for %d files\n') % (bytecount, filecount)
        )

        yield struct.pack(b'>QQ', filecount, bytecount)
        yield struct.pack(b'>H', len(requires) + 1)
        yield requires + b'\0'

        # This is where we'll add compression in the future.
        assert compression == b'UN'

        progress = repo.ui.makeprogress(
            _(b'bundle'), total=bytecount, unit=_(b'bytes')
        )
        progress.update(0)

        for chunk in it:
            progress.increment(step=len(chunk))
            yield chunk

        progress.complete()

    return requirements, gen()

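# Editor's sketch (not part of this commit): the fixed-size HGS1 bundle
# header laid out by generatebundlev1() above, built and re-parsed with
# struct. The counts and requirements here are made up for illustration.
import struct

requires = b'revlogv1,generaldelta'
header = (
    b'HGS1'                                  # magic / bundle version
    + b'UN'                                  # compression type
    + struct.pack(b'>QQ', 3, 123456)         # file count, byte count
    + struct.pack(b'>H', len(requires) + 1)  # requirements length + NUL
    + requires
    + b'\0'
)
filecount, bytecount = struct.unpack(b'>QQ', header[6:22])
assert (filecount, bytecount) == (3, 123456)
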
def consumev1(repo, fp, filecount, bytecount):
    """Apply the contents from version 1 of a streaming clone file handle.

    This takes the output from "stream_out" and applies it to the specified
    repository.

    Like "stream_out," the status line added by the wire protocol is not
    handled by this function.
    """
    with repo.lock():
        repo.ui.status(
            _(b'%d files to transfer, %s of data\n')
            % (filecount, util.bytecount(bytecount))
        )
        progress = repo.ui.makeprogress(
            _(b'clone'), total=bytecount, unit=_(b'bytes')
        )
        progress.update(0)
        start = util.timer()

        # TODO: get rid of (potential) inconsistency
        #
        # If transaction is started and any @filecache property is
        # changed at this point, it causes inconsistency between
        # in-memory cached property and streamclone-ed file on the
        # disk. Nested transaction prevents transaction scope "clone"
        # below from writing in-memory changes out at the end of it,
        # even though in-memory changes are discarded at the end of it
        # regardless of transaction nesting.
        #
        # But transaction nesting can't be simply prohibited, because
        # nesting occurs also in ordinary case (e.g. enabling
        # clonebundles).

        with repo.transaction(b'clone'):
            with repo.svfs.backgroundclosing(repo.ui, expectedcount=filecount):
                for i in pycompat.xrange(filecount):
                    # XXX doesn't support '\n' or '\r' in filenames
                    l = fp.readline()
                    try:
                        name, size = l.split(b'\0', 1)
                        size = int(size)
                    except (ValueError, TypeError):
                        raise error.ResponseError(
                            _(b'unexpected response from remote server:'), l
                        )
                    if repo.ui.debugflag:
                        repo.ui.debug(
                            b'adding %s (%s)\n' % (name, util.bytecount(size))
                        )
                    # for backwards compat, name was partially encoded
                    path = store.decodedir(name)
                    with repo.svfs(path, b'w', backgroundclose=True) as ofp:
                        for chunk in util.filechunkiter(fp, limit=size):
                            progress.increment(step=len(chunk))
                            ofp.write(chunk)

        # force @filecache properties to be reloaded from
        # streamclone-ed file at next access
        repo.invalidate(clearfilecache=True)

        elapsed = util.timer() - start
        if elapsed <= 0:
            elapsed = 0.001
        progress.complete()
        repo.ui.status(
            _(b'transferred %s in %.1f seconds (%s/sec)\n')
            % (
                util.bytecount(bytecount),
                elapsed,
                util.bytecount(bytecount / elapsed),
            )
        )


def readbundle1header(fp):
    compression = fp.read(2)
    if compression != b'UN':
        raise error.Abort(
            _(
                b'only uncompressed stream clone bundles are '
                b'supported; got %s'
            )
            % compression
        )

    filecount, bytecount = struct.unpack(b'>QQ', fp.read(16))
    requireslen = struct.unpack(b'>H', fp.read(2))[0]
    requires = fp.read(requireslen)

    if not requires.endswith(b'\0'):
        raise error.Abort(
            _(
                b'malformed stream clone bundle: '
                b'requirements not properly encoded'
            )
        )

    requirements = set(requires.rstrip(b'\0').split(b','))

    return filecount, bytecount, requirements


def applybundlev1(repo, fp):
    """Apply the content from a stream clone bundle version 1.

    We assume the 4 byte header has been read and validated and the file handle
    is at the 2 byte compression identifier.
    """
    if len(repo):
        raise error.Abort(
            _(b'cannot apply stream clone bundle on non-empty repo')
        )

    filecount, bytecount, requirements = readbundle1header(fp)
    missingreqs = requirements - repo.supportedformats
    if missingreqs:
        raise error.Abort(
            _(b'unable to apply stream clone: unsupported format: %s')
            % b', '.join(sorted(missingreqs))
        )

    consumev1(repo, fp, filecount, bytecount)


class streamcloneapplier(object):
    """Class to manage applying streaming clone bundles.

    We need to wrap ``applybundlev1()`` in a dedicated type to enable bundle
    readers to perform bundle type-specific functionality.
    """

    def __init__(self, fh):
        self._fh = fh

    def apply(self, repo):
        return applybundlev1(repo, self._fh)

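# Editor's illustration (not part of this commit): how a bundle reader is
# expected to drive this class once it has recognized the "HGS1" magic and
# left the file handle at the compression identifier. `bundlefh` and `repo`
# are hypothetical stand-ins.
#
#     applier = streamcloneapplier(bundlefh)
#     applier.apply(repo)  # delegates to applybundlev1()
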
# type of file to stream
_fileappend = 0  # append only file
_filefull = 1  # full snapshot file

# Source of the file
_srcstore = b's'  # store (svfs)
_srccache = b'c'  # cache (cache)

# This is its own function so extensions can override it.
def _walkstreamfullstorefiles(repo):
    """list snapshot files from the store"""
    fnames = []
    if not repo.publishing():
        fnames.append(b'phaseroots')
    return fnames


def _filterfull(entry, copy, vfsmap):
    """actually copy the snapshot files"""
    src, name, ftype, data = entry
    if ftype != _filefull:
        return entry
    return (src, name, ftype, copy(vfsmap[src].join(name)))


@contextlib.contextmanager
def maketempcopies():
    """return a function to temporarily copy files"""
    files = []
    try:

        def copy(src):
            fd, dst = pycompat.mkstemp()
            os.close(fd)
            files.append(dst)
            util.copyfiles(src, dst, hardlink=True)
            return dst

        yield copy
    finally:
        for tmp in files:
            util.tryunlink(tmp)


def _makemap(repo):
    """make a (src -> vfs) map for the repo"""
    vfsmap = {
        _srcstore: repo.svfs,
        _srccache: repo.cachevfs,
    }
    # we keep repo.vfs out of the map on purpose, there are too many dangers
    # there (eg: .hg/hgrc)
    assert repo.vfs not in vfsmap.values()

    return vfsmap

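# Editor's note (commentary added for this writeup, not in the commit): the
# assert in _makemap() above is skipped when Python runs with -O, which is
# presumably why this changeset repeats the check below as an explicit
# error.ProgrammingError that also fires in optimized mode.
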
def _emit2(repo, entries, totalfilesize):
    """actually emit the stream bundle"""
    vfsmap = _makemap(repo)
    # we keep repo.vfs out of the map on purpose, there are too many dangers
    # there (eg: .hg/hgrc),
    #
    # this check is duplicated (from _makemap) as an author might think this
    # is fine, while this is really not fine.
    if repo.vfs in vfsmap.values():
        raise error.ProgrammingError(
            b'repo.vfs must not be added to vfsmap for security reasons'
        )

    progress = repo.ui.makeprogress(
        _(b'bundle'), total=totalfilesize, unit=_(b'bytes')
    )
    progress.update(0)
    with maketempcopies() as copy, progress:
        # copy is delayed until we are in the try
        entries = [_filterfull(e, copy, vfsmap) for e in entries]
        yield None  # this releases the lock on the repository
        seen = 0

        for src, name, ftype, data in entries:
            vfs = vfsmap[src]
            yield src
            yield util.uvarintencode(len(name))
            if ftype == _fileappend:
                fp = vfs(name)
                size = data
            elif ftype == _filefull:
                fp = open(data, b'rb')
                size = util.fstat(fp).st_size
            try:
                yield util.uvarintencode(size)
                yield name
                if size <= 65536:
                    chunks = (fp.read(size),)
                else:
                    chunks = util.filechunkiter(fp, limit=size)
                for chunk in chunks:
                    seen += len(chunk)
                    progress.update(seen)
                    yield chunk
            finally:
                fp.close()

def _test_sync_point_walk_1(repo):
    """a function for synchronisation during tests"""


def _test_sync_point_walk_2(repo):
    """a function for synchronisation during tests"""


def generatev2(repo, includes, excludes, includeobsmarkers):
    """Emit content for version 2 of a streaming clone.

    the data stream consists of the following entries:
    1) A char representing the file destination (eg: store or cache)
    2) A varint containing the length of the filename
    3) A varint containing the length of file data
    4) N bytes containing the filename (the internal, store-agnostic form)
    5) N bytes containing the file data

    Returns a 3-tuple of (file count, file size, data iterator).
    """

    with repo.lock():

        entries = []
        totalfilesize = 0

        matcher = None
        if includes or excludes:
            matcher = narrowspec.match(repo.root, includes, excludes)

        repo.ui.debug(b'scanning\n')
        for rl_type, name, ename, size in _walkstreamfiles(repo, matcher):
            if size:
                ft = _fileappend
                if rl_type & store.FILEFLAGS_VOLATILE:
                    ft = _filefull
                entries.append((_srcstore, name, ft, size))
                totalfilesize += size
        for name in _walkstreamfullstorefiles(repo):
            if repo.svfs.exists(name):
                totalfilesize += repo.svfs.lstat(name).st_size
                entries.append((_srcstore, name, _filefull, None))
        if includeobsmarkers and repo.svfs.exists(b'obsstore'):
            totalfilesize += repo.svfs.lstat(b'obsstore').st_size
            entries.append((_srcstore, b'obsstore', _filefull, None))
        for name in cacheutil.cachetocopy(repo):
            if repo.cachevfs.exists(name):
                totalfilesize += repo.cachevfs.lstat(name).st_size
                entries.append((_srccache, name, _filefull, None))

        chunks = _emit2(repo, entries, totalfilesize)
        first = next(chunks)
        assert first is None
        _test_sync_point_walk_1(repo)
    _test_sync_point_walk_2(repo)

    return len(entries), totalfilesize, chunks

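# Editor's sketch (not part of this commit): framing one v2 stream entry per
# the docstring above. util.uvarintencode is Mercurial-internal, so a
# minimal LEB128-style unsigned varint encoder stands in for it here.
def _uvarint(value):
    data = b''
    while value >= 0x80:
        data += bytes((0x80 | (value & 0x7F),))
        value >>= 7
    return data + bytes((value,))

name, filedata = b'data/foo.i', b'hello'
entry = (
    b's'                       # destination: store (svfs)
    + _uvarint(len(name))      # varint filename length
    + _uvarint(len(filedata))  # varint data length
    + name                     # filename, store-agnostic form
    + filedata                 # raw file data
)
assert entry == b's\x0a\x05data/foo.ihello'
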
@contextlib.contextmanager
def nested(*ctxs):
    this = ctxs[0]
    rest = ctxs[1:]
    with this:
        if rest:
            with nested(*rest):
                yield
        else:
            yield

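# Editor's illustration (not part of this commit): nested() recursively
# enters an arbitrary number of context managers and unwinds them in
# reverse order, which is how consumev2 below holds one backgroundclosing
# context per vfs at the same time. `tag` is a hypothetical helper.
@contextlib.contextmanager
def tag(label, log):
    log.append(b'enter ' + label)
    yield
    log.append(b'exit ' + label)

log = []
with nested(tag(b'a', log), tag(b'b', log)):
    pass
assert log == [b'enter a', b'enter b', b'exit b', b'exit a']
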
def consumev2(repo, fp, filecount, filesize):
    """Apply the contents from a version 2 streaming clone.

    Data is read from an object that only needs to provide a ``read(size)``
    method.
    """
    with repo.lock():
        repo.ui.status(
            _(b'%d files to transfer, %s of data\n')
            % (filecount, util.bytecount(filesize))
        )

        start = util.timer()
        progress = repo.ui.makeprogress(
            _(b'clone'), total=filesize, unit=_(b'bytes')
        )
        progress.update(0)

        vfsmap = _makemap(repo)
        # we keep repo.vfs out of the map on purpose, there are too many
        # dangers there (eg: .hg/hgrc),
        #
        # this check is duplicated (from _makemap) as an author might think
        # this is fine, while this is really not fine.
        if repo.vfs in vfsmap.values():
            raise error.ProgrammingError(
                b'repo.vfs must not be added to vfsmap for security reasons'
            )

        with repo.transaction(b'clone'):
            ctxs = (vfs.backgroundclosing(repo.ui) for vfs in vfsmap.values())
            with nested(*ctxs):
                for i in range(filecount):
                    src = util.readexactly(fp, 1)
                    vfs = vfsmap[src]
                    namelen = util.uvarintdecodestream(fp)
                    datalen = util.uvarintdecodestream(fp)

                    name = util.readexactly(fp, namelen)

                    if repo.ui.debugflag:
                        repo.ui.debug(
                            b'adding [%s] %s (%s)\n'
                            % (src, name, util.bytecount(datalen))
                        )

                    with vfs(name, b'w') as ofp:
                        for chunk in util.filechunkiter(fp, limit=datalen):
                            progress.increment(step=len(chunk))
                            ofp.write(chunk)

        # force @filecache properties to be reloaded from
        # streamclone-ed file at next access
        repo.invalidate(clearfilecache=True)

        elapsed = util.timer() - start
        if elapsed <= 0:
            elapsed = 0.001
        repo.ui.status(
            _(b'transferred %s in %.1f seconds (%s/sec)\n')
            % (
                util.bytecount(progress.pos),
                elapsed,
                util.bytecount(progress.pos / elapsed),
            )
        )
        progress.complete()

def applybundlev2(repo, fp, filecount, filesize, requirements):
    from . import localrepo

    missingreqs = [r for r in requirements if r not in repo.supported]
    if missingreqs:
        raise error.Abort(
            _(b'unable to apply stream clone: unsupported format: %s')
            % b', '.join(sorted(missingreqs))
        )

    consumev2(repo, fp, filecount, filesize)

    # new requirements = old non-format requirements +
    #                    new format-related remote requirements
    # requirements from the streamed-in repository
    repo.requirements = set(requirements) | (
        repo.requirements - repo.supportedformats
    )
    repo.svfs.options = localrepo.resolvestorevfsoptions(
        repo.ui, repo.requirements, repo.features
    )
    scmutil.writereporequirements(repo)
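
# Editor's sketch (not part of this commit): the requirement merge performed
# by applybundlev2 above, on made-up sets. Format requirements come from the
# streamed-in repository; non-format requirements survive from the local
# repo.
supportedformats = {b'revlogv1', b'generaldelta'}
local = {b'store', b'fncache', b'revlogv1'}
streamed = {b'revlogv1', b'generaldelta'}
merged = set(streamed) | (local - supportedformats)
assert merged == {b'store', b'fncache', b'revlogv1', b'generaldelta'}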